replication_package.zip
zenodo_data
Code-transformer
.env
950 Bytes
README.md
1.9 kB
binaries
.gitkeep
0 Bytes
JavaMethodExtractor-1.0.0-SNAPSHOT.jar
781.6 kB
java-parser-1.0-SNAPSHOT.jar
1.6 MB
semantic
114.2 MB
vocabularies.p.gzip
350.7 kB
code_transformer
__init__.py
0 Bytes
configuration
__init__.py
0 Bytes
attention.py
151 Bytes
code_transformer.py
1.8 kB
configuration_utils.py
1.0 kB
great_transformer.py
1.5 kB
transformer_lm_decoder.py
3.4 kB
transformer_lm_encoder.py
858 Bytes
env.py
2.3 kB
experiments
__init__.py
0 Bytes
code_transformer
__init__.py
0 Bytes
code_summarization.py
664 Bytes
code_summarization.yaml
6.0 kB
language_modeling.py
1.0 kB
language_modeling.yaml
2.0 kB
experiment.py
33.0 kB
great
__init__.py
0 Bytes
code_summarization.py
713 Bytes
code_summarization.yaml
1.7 kB
log.py
3.1 kB
mixins
__init__.py
0 Bytes
code_summarization.py
11.1 kB
code_summarization_great.py
5.3 kB
code_trans_lm.py
1.2 kB
code_trans_transformer.py
2.7 kB
great_transformer.py
2.8 kB
xl_net_lm.py
1.8 kB
xl_net_transformer.py
3.6 kB
paper
__init__.py
0 Bytes
ct_go.yaml
2.1 kB
ct_java_pretrain_lm.yaml
1.8 kB
ct_java_small.yaml
2.1 kB
ct_java_small_ablation_only_ancestor_sp.yaml
2.1 kB
ct_java_small_ablation_only_ppr.yaml
2.1 kB
ct_java_small_ablation_only_shortest_paths.yaml
2.1 kB
ct_java_small_ablation_only_sibling_sp.yaml
2.1 kB
ct_java_small_only_ast.yaml
2.1 kB
ct_java_small_pretrain.yaml
2.1 kB
ct_javascript.yaml
2.1 kB
ct_multilang.yaml
2.1 kB
ct_multilang_go.yaml
2.1 kB
ct_multilang_javascript.yaml
2.1 kB
ct_multilang_lm.yaml
1.8 kB
ct_multilang_lm_pretrain.yaml
2.1 kB
ct_multilang_python.yaml
2.1 kB
ct_multilang_ruby.yaml
2.1 kB
ct_no_pointer_go.yaml
2.1 kB
ct_no_pointer_java_small.yaml
2.1 kB
ct_no_pointer_java_small_only_ast.yaml
2.1 kB
ct_no_pointer_javascript.yaml
2.1 kB
ct_no_pointer_multilang.yaml
2.1 kB
ct_no_pointer_python.yaml
2.1 kB
ct_no_pointer_ruby.yaml
2.1 kB
ct_python.yaml
2.1 kB
ct_ruby.yaml
2.1 kB
great_go.yaml
1.5 kB
great_java_small.yaml
1.5 kB
great_javascript.yaml
1.5 kB
great_multilang.yaml
1.5 kB
great_python.yaml
1.5 kB
great_ruby.yaml
1.5 kB
xl_net_go.yaml
1.7 kB
xl_net_java_small.yaml
1.7 kB
xl_net_javascript.yaml
1.7 kB
xl_net_multilang.yaml
1.7 kB
xl_net_no_pointer_java_small.yaml
1.7 kB
xl_net_python.yaml
1.7 kB
xl_net_ruby.yaml
1.7 kB
preprocessing
__init__.py
0 Bytes
preprocess-1-code2seq.yaml
849 Bytes
preprocess-1-csn.yaml
864 Bytes
preprocess-1.py
8.7 kB
preprocess-2.py
16.2 kB
preprocess-2.yaml
892 Bytes
xl_net
__init__.py
0 Bytes
base.py
455 Bytes
code_summarization.py
589 Bytes
code_summarization.yaml
1.7 kB
language_modeling.py
437 Bytes
language_modeling.yaml
1.0 kB
modeling
__init__.py
0 Bytes
code_transformer
__init__.py
0 Bytes
code_transformer.py
37.5 kB
decoder.py
1.5 kB
distance_embeddings.py
2.3 kB
lm.py
14.8 kB
constants.py
2.7 kB
data_utils.py
5.5 kB
decoder
__init__.py
0 Bytes
pointer.py
9.7 kB
transformer.py
13.0 kB
great_transformer
__init__.py
0 Bytes
great_transformer.py
14.4 kB
transformer.py
1.9 kB
modelmanager
__init__.py
138 Bytes
base.py
4.2 kB
code_transformer.py
5.0 kB
great.py
3.6 kB
xl_net.py
3.2 kB
xl_net
__init__.py
0 Bytes
decoder.py
1.4 kB
xl_net_language_model.py
9.5 kB
preprocessing
README.md
482 Bytes
__init__.py
0 Bytes
datamanager
__init__.py
0 Bytes
base.py
11.9 kB
c2s
__init__.py
0 Bytes
raw.py
1.8 kB
csn
__init__.py
0 Bytes
raw.py
2.1 kB
preprocessed.py
15.2 kB
dataset
__init__.py
0 Bytes
ablation.py
6.5 kB
base.py
14.8 kB
code_summarization.py
23.9 kB
lm.py
9.4 kB
graph
__init__.py
0 Bytes
alg.py
4.2 kB
ast.py
5.9 kB
binning.py
5.6 kB
distances.py
11.3 kB
transform.py
5.4 kB
nlp
__init__.py
0 Bytes
javaparser.py
1.1 kB
semantic.py
5.1 kB
text.py
3.7 kB
tokenization.py
6.7 kB
vocab.py
9.3 kB
pipeline
__init__.py
0 Bytes
code2seq.py
8.8 kB
filter.py
12.7 kB
stage1.py
9.1 kB
stage2.py
3.3 kB
utils
__init__.py
0 Bytes
data.py
2.5 kB
inference.py
11.5 kB
io.py
1.1 kB
log.py
2.9 kB
loss.py
826 Bytes
metrics.py
17.6 kB
sacred.py
1.5 kB
timing.py
1.3 kB
vocab.py
1.1 kB
ct-env.yml
2.9 kB
data
stage2
.gitkeep
0 Bytes
figures
code_transformer_overview.png
96.3 kB
preprocessing_overview.png
111.4 kB
fine-tuning-experiments
calc_stats.py
1.9 kB
fine_tune_on_projects.py
3.1 kB
fine_tuning_config.yaml
2.0 kB
from_scratch_config.yaml
2.0 kB
from_scratch_reduced_config.yaml
2.0 kB
preprocess_projects.py
5.1 kB
test_model.py
6.3 kB
train_reduced_from_scratch.py
2.3 kB
images
.gitkeep
0 Bytes
logs
.gitkeep
0 Bytes
models
.gitkeep
0 Bytes
ct_code_summarization
CT-20
config.json
2.9 kB
snapshot-30000.p
454.4 MB
notebooks
deduplicate_java_pretrain.ipynb
12.1 kB
interactive_prediction.ipynb
15.4 kB
preprocessed
.gitkeep
0 Bytes
raw_java
.gitkeep
0 Bytes
requirements.txt
387 Bytes
results
.gitkeep
0 Bytes
scripts
code2seq
combine-vocabs-code2seq.sh
2.3 kB
preprocess-code2seq-helper.py
12.1 kB
preprocess-code2seq.py
3.6 kB
preprocess-code2seq.sh
2.9 kB
deduplicate-java-pretrain.py
5.7 kB
evaluate-multilanguage.py
9.7 kB
evaluate.py
9.1 kB
extract-java-methods.py
1.4 kB
run-experiment.py
623 Bytes
run-preprocessing.py
906 Bytes
setup.py
818 Bytes
sub_modules
code2seq
.gitignore
41 Bytes
CSharpExtractor
.gitattributes
2.5 kB
.gitignore
4.2 kB
CSharpExtractor
.nuget
packages.config
515 Bytes
CSharpExtractor.sln
2.4 kB
Extractor
Extractor.cs
8.3 kB
Extractor.csproj
521 Bytes
PathFinder.cs
2.6 kB
Program.cs
1.6 kB
Properties
launchSettings.json
208 Bytes
Temp.cs
176 Bytes
Tree
Tree.cs
9.8 kB
Utilities.cs
5.5 kB
Variable.cs
3.0 kB
extract.py
3.1 kB
Input.java
43 Bytes
JavaExtractor
JPredict
.classpath
1.1 kB
.gitignore
8 Bytes
src
main
java
JavaExtractor
App.java
2.2 kB
Common
CommandLineValues.java
1.6 kB
Common.java
2.5 kB
MethodContent.java
607 Bytes
ExtractFeaturesTask.java
2.8 kB
FeatureExtractor.java
8.0 kB
FeaturesEntities
ProgramFeatures.java
1.2 kB
ProgramRelation.java
446 Bytes
Property.java
8.3 kB
Visitors
FunctionVisitor.java
2.7 kB
LeavesCollectorVisitor.java
2.3 kB
Test.java
89 Bytes
extract.py
3.5 kB
LICENSE
1.1 kB
Python150kExtractor
README.md
1.6 kB
extract.py
5.4 kB
preprocess.sh
1.6 kB
README.md
16.4 kB
__init__.py
0 Bytes
baseline_tokenization
input_example.txt
583 Bytes
javalang
__init__.py
113 Bytes
ast.py
1.8 kB
javadoc.py
2.9 kB
parse.py
1.1 kB
parser.py
73.7 kB
test
__init__.py
0 Bytes
source
package-info
AnnotationJavadoc.java
95 Bytes
AnnotationOnly.java
35 Bytes
JavadocAnnotation.java
95 Bytes
JavadocOnly.java
86 Bytes
NoAnnotationNoJavadoc.java
26 Bytes
test_java_8_syntax.py
8.7 kB
test_javadoc.py
305 Bytes
test_package_declaration.py
2.0 kB
test_util.py
1.9 kB
tokenizer.py
17.0 kB
tree.py
6.8 kB
util.py
4.2 kB
subtokenize_nmt_baseline.py
1.6 kB
code2seq.py
2.0 kB
common.py
5.8 kB
config.py
3.6 kB
evaluate.sh
893 Bytes
extractor.py
1.7 kB
images
network.png
68.0 kB
interactive_predict.py
2.5 kB
model.py
48.1 kB
preprocess.py
6.2 kB
preprocess.sh
4.3 kB
preprocess_csharp.sh
4.5 kB
reader.py
17.9 kB
train.sh
828 Bytes
train_python150k.sh
427 Bytes
java-method-extractor
.classpath
1.1 kB
JavaExtractor (1).iml
315 Bytes
JavaExtractor.iml
1.5 kB
JavaMethodExtractor.iml
1.1 kB
code-2-seq-java-extractor.iml
1.2 kB
dependency-reduced-pom.xml
1.4 kB
extract.py
3.5 kB
pom.xml
3.7 kB
src
main
JavaExtractor
App.java
2.2 kB
Common
CommandLineValues.java
1.4 kB
Common.java
2.5 kB
MethodContent.java
460 Bytes
ExtractFeaturesTask.java
2.6 kB
FeatureExtractor.java
1.9 kB
FeaturesEntities
ProgramFeatures.java
1.0 kB
ProgramRelation.java
501 Bytes
Property.java
8.3 kB
Visitors
FunctionVisitor.java
2.8 kB
LeavesCollectorVisitor.java
2.3 kB
java
CommandLineValues.java
1.2 kB
ExtractMethodsTask.java
2.5 kB
JavaMethodExtractor.java
5.0 kB
MethodContent.java
444 Bytes
MethodVisitor.java
2.3 kB
target
JavaMethodExtractor-1.0.0-SNAPSHOT.jar
781.6 kB
java-parser
java-parser.iml
1.4 kB
java-parser.iws
20.9 kB
pom.xml
2.9 kB
src
main
java
ASTNode.java
1.3 kB
ASTParser.java
7.1 kB
META-INF
MANIFEST.MF
45 Bytes
target
java-parser-1.0-SNAPSHOT.jar
1.6 MB
tests
modeling
code_transformer
test_code_transformer.py
39.4 kB
great
test_great.py
3.2 kB
xl_net
test_xl_net.py
4.5 kB
preprocessing
binning.py
5.7 kB
test_loss.py
2.3 kB
test_metrics.py
9.7 kB
Code2seq-and-Treelstm
README.md
1.9 kB
cloned_repos
.gitkeep
0 Bytes
configs
code2seq_config.yaml
967 Bytes
code2seq_vocabulary.pkl
1.4 MB
psiminer_code2seq_config.json
864 Bytes
psiminer_treelstm_config.json
838 Bytes
treelstm_config.yaml
826 Bytes
treelstm_vocabulary.pkl
1.3 MB
dependencies
.gitkeep
0 Bytes
Miner
README.md
566 Bytes
build.gradle
1.6 kB
detekt.yml
17.4 kB
gradle
wrapper
gradle-wrapper.jar
59.2 kB
gradle-wrapper.properties
202 Bytes
gradlew
5.8 kB
gradlew.bat
2.8 kB
miner-core
build.gradle
228 Bytes
src
main
kotlin
org
miner
dataset
DatasetSample.kt
465 Bytes
package-info.java
18 Bytes
processors
CodeCommentDiffs.kt
19.0 kB
CodeCommentTokenizer.kt
4.5 kB
MethodChangesExtractor.kt
4.7 kB
ProjectMethodExtractor.kt
6.1 kB
RefactoringExtractor.kt
4.3 kB
utils
GitUtils.kt
546 Bytes
MethodUtils.kt
802 Bytes
PsiUtils.kt
2.8 kB
RefactoringUtils.kt
2.9 kB
miner-headless
build.gradle.kts
1.2 kB
src
main
kotlin
PluginRunner.kt
10.8 kB
RawSampleWriter.kt
921 Bytes
StatisticHandler.kt
1.1 kB
StatisticWriter.kt
634 Bytes
resources
META-INF
plugin.xml
830 Bytes
MinerBundle.properties
53 Bytes
inspectionDescriptions
CodeComment.html
58 Bytes
run_miner.sh
574 Bytes
settings.gradle
85 Bytes
psiminer
.git
HEAD
23 Bytes
branches
config
275 Bytes
description
73 Bytes
hooks
applypatch-msg.sample
478 Bytes
commit-msg.sample
896 Bytes
fsmonitor-watchman.sample
4.7 kB
post-update.sample
189 Bytes
pre-applypatch.sample
424 Bytes
pre-commit.sample
1.6 kB
pre-merge-commit.sample
416 Bytes
pre-push.sample
1.4 kB
pre-rebase.sample
4.9 kB
pre-receive.sample
544 Bytes
prepare-commit-msg.sample
1.5 kB
push-to-checkout.sample
2.8 kB
update.sample
3.6 kB
index
12.7 kB
info
exclude
240 Bytes
logs
HEAD
193 Bytes
refs
heads
master
193 Bytes
remotes
origin
HEAD
193 Bytes
objects
info
pack
pack-8f1c89f75e41a887c91e9e7793a383a690dd1f48.idx
78.5 kB
pack-8f1c89f75e41a887c91e9e7793a383a690dd1f48.pack
541.6 kB
packed-refs
301 Bytes
refs
heads
master
41 Bytes
remotes
origin
HEAD
32 Bytes
tags
.github
workflows
main.yml
2.4 kB
.gitignore
92 Bytes
.idea
.gitignore
176 Bytes
runConfigurations
Run_on_test_data__java_.xml
1.1 kB
Run_on_test_data__kotlin_.xml
1.1 kB
Run_unit_tests.xml
917 Bytes
LICENSE
11.3 kB
README.md
4.4 kB
build.gradle.kts
2.5 kB
configs
java_ast_methods.json
828 Bytes
java_paths_methods.json
843 Bytes
kotlin_ast_methods.json
323 Bytes
detekt.yml
701 Bytes
docs
filters.md
2.0 kB
label_extractors.md
919 Bytes
preprocessing.md
994 Bytes
storages.md
2.3 kB
tree_transormations.md
5.2 kB
gradle
wrapper
gradle-wrapper.jar
58.7 kB
gradle-wrapper.properties
202 Bytes
gradle.properties
358 Bytes
gradlew
5.8 kB
gradlew.bat
2.9 kB
psiminer-cli
build.gradle.kts
674 Bytes
src
main
kotlin
PluginRunner.kt
4.2 kB
config
Config.kt
745 Bytes
FilterConfigs.kt
1.8 kB
LabelExtractorConfigs.kt
472 Bytes
PreprocessingConfigs.kt
865 Bytes
PsiNodeExcludeTreeTransformationConfigs.kt
2.3 kB
PsiTreeTransformationConfigs.kt
2.4 kB
StorageConfigs.kt
1.4 kB
resources
META-INF
plugin.xml
793 Bytes
log4j.properties
618 Bytes
psiminer-core
build.gradle.kts
297 Bytes
src
main
kotlin
Common.kt
1.8 kB
Pipeline.kt
4.4 kB
RepositoryOpener.kt
1.7 kB
filter
CodeLinesFilter.kt
791 Bytes
Filter.kt
426 Bytes
MethodFilters.kt
1.5 kB
TreeSizeFilter.kt
613 Bytes
labelextractor
LabelExtractor.kt
1.2 kB
MethodNameLabelExtractor.kt
883 Bytes
psi
Parser.kt
2.0 kB
Utils.kt
2.8 kB
language
JavaHandler.kt
1.1 kB
KotlinHandler.kt
1.8 kB
LanguageHandler.kt
1.3 kB
method
JavaMethodProvider.kt
1.1 kB
KotlinMethodProvider.kt
1.6 kB
MethodProvider.kt
428 Bytes
nodeProperties
IsHidden.kt
208 Bytes
NodeType.kt
274 Bytes
Token.kt
738 Bytes
transformations
JavaCompressOperatorTransformation.kt
1.4 kB
JavaHideLiteralsTransformation.kt
1.8 kB
JavaRemoveCommentsTransformation.kt
805 Bytes
PsiTreeTransformation.kt
315 Bytes
excludenode
ExcludeNodeTransformation.kt
668 Bytes
ExcludeWhiteSpaceTransformation.kt
296 Bytes
JavaExcludeNodeTransformations.kt
1.9 kB
typeresolve
JavaResolveTypeTransformation.kt
2.6 kB
resolvedTokenType.kt
1.1 kB
storage
Storage.kt
1.5 kB
paths
AstminerNodeWrapper.kt
663 Bytes
Code2SeqStorage.kt
4.3 kB
tree
JsonTreeStorage.kt
2.5 kB
test
kotlin
BasePsiRequiredTest.kt
2.6 kB
CommonTest.kt
775 Bytes
filter
AnnotationFilterTest.kt
1.7 kB
CodeLinesFilterTest.kt
1.7 kB
ConstructorFilterTest.kt
866 Bytes
EmptyMethodFilterTest.kt
1.8 kB
ModifierFilterTest.kt
1.5 kB
TreeSizeFilterTest.kt
1.7 kB
labelextractor
methodname
JavaMethodNameLabelExtractorTest.kt
2.7 kB
KotlinMethodNameLabelExtractorTest.kt
2.8 kB
psi
transformations
JavaHideLiteralsTransformationTest.kt
2.1 kB
excludenode
ExcludeWhiteSpaceTransformationTest.kt
513 Bytes
JavaExcludeKeywordTransformationTest.kt
272 Bytes
JavaExcludeTransformationTest.kt
1.1 kB
KotlinExcludeTransformationTest.kt
1.1 kB
typeresolve
JavaResolveTypeTransformationTest.kt
1.9 kB
resources
data
java
JavaAnnotatedMethods.java
249 Bytes
JavaEmptyMethods.java
865 Bytes
JavaMethods.java
1.2 kB
kotlin
KotlinAnnotatedMethods.kt
226 Bytes
KotlinEmptyMethods.kt
824 Bytes
KotlinMethods.kt
1.1 kB
log4j.properties
330 Bytes
psiminer.sh
454 Bytes
settings.gradle.kts
317 Bytes
experiments
fine_tune_and_calc_results.py
4.0 kB
repos_to_model_input.py
1.9 kB
summarize_results.py
3.3 kB
extracted_methods
.gitkeep
0 Bytes
ft_env.yml
2.8 kB
models
code2seq.ckpt
62.1 MB
fine-tuning-experiments
.gitkeep
0 Bytes
treelstm.ckpt
76.9 MB
requirements.txt
313 Bytes
results
.gitkeep
0 Bytes
scripts
__init__.py
0 Bytes
code2seq
__init__.py
0 Bytes
dump_results.py
2.2 kB
fine_tune.py
5.3 kB
test_single.py
1.1 kB
preprocessing
__init__.py
0 Bytes
clone_repos.py
646 Bytes
mine_method_updates.py
1.1 kB
preprocess.py
4.4 kB
split_mined_methods.py
2.9 kB
save_metrics.py
2.7 kB
treelstm
__init__.py
0 Bytes
dump_results.py
2.3 kB
fine_tune.py
5.2 kB
test_single.py
838 Bytes
utils.py
1.2 kB
Miner
README.md
566 Bytes
build.gradle
1.6 kB
detekt.yml
17.4 kB
gradle
wrapper
gradle-wrapper.jar
59.2 kB
gradle-wrapper.properties
202 Bytes
gradlew
5.8 kB
gradlew.bat
2.8 kB
miner-core
build.gradle
228 Bytes
src
main
kotlin
org
miner
dataset
DatasetSample.kt
465 Bytes
package-info.java
18 Bytes
processors
CodeCommentDiffs.kt
19.0 kB
CodeCommentTokenizer.kt
4.5 kB
MethodChangesExtractor.kt
4.7 kB
ProjectMethodExtractor.kt
6.1 kB
RefactoringExtractor.kt
4.3 kB
utils
GitUtils.kt
546 Bytes
MethodUtils.kt
802 Bytes
PsiUtils.kt
2.8 kB
RefactoringUtils.kt
2.9 kB
miner-headless
build.gradle.kts
1.2 kB
src
main
kotlin
PluginRunner.kt
10.8 kB
RawSampleWriter.kt
921 Bytes
StatisticHandler.kt
1.1 kB
StatisticWriter.kt
634 Bytes
resources
META-INF
plugin.xml
830 Bytes
MinerBundle.properties
53 Bytes
inspectionDescriptions
CodeComment.html
58 Bytes
run_miner.sh
574 Bytes
settings.gradle
85 Bytes