Skip to content

Commit c0db1fd

Browse files
2 parents b757b66 + 6c72783 commit c0db1fd

10 files changed

Lines changed: 728 additions & 10 deletions

File tree

README.md

Lines changed: 1 addition & 1 deletion
Original file line numberDiff line numberDiff line change
@@ -12,7 +12,7 @@ Its role is to mine repositories (from the Apache Software Project) to see how m
1212

1313
## Installing
1414

15-
1. Ensure **Python 3.10.x** or higher is installed
15+
1. Ensure **Python 3.9.x** or higher is installed
1616

1717
2. Clone project
1818
Clone the repository locally, or download and extract the ZIP file.

requirements.txt

Lines changed: 2 additions & 1 deletion
Original file line numberDiff line numberDiff line change
@@ -2,4 +2,5 @@ pydriller~=2.7
22
pytest
33
pytest-asyncio
44
matplotlib~=3.9.4
5-
tqdm
5+
tqdm
6+
requests

resources/repositories/java_repos.txt

Lines changed: 336 additions & 1 deletion
Original file line numberDiff line numberDiff line change
@@ -181,4 +181,339 @@ xalan-j
181181
xmlbeans
182182
xmlgraphics-batik
183183
xmlgraphics-fop
184-
zookeeper
184+
zookeeper
185+
xalan-j
186+
directory-studio
187+
maven-resources
188+
xmlgraphics-fop
189+
maven-scm
190+
directory-samples
191+
maven-release
192+
synapse
193+
maven-mercury
194+
cayenne
195+
commons-collections
196+
openjpa
197+
mina
198+
poi
199+
nutch
200+
commons-codec
201+
maven-shared
202+
commons-lang
203+
jsecurity
204+
activemq
205+
xmlgraphics-commons
206+
struts1
207+
commons-io
208+
httpcomponents-core
209+
maven-doxia-sitetools
210+
struts-sandbox
211+
httpcomponents-client
212+
jackrabbit
213+
sanselan
214+
continuum
215+
maven-ant-tasks
216+
maven-plugin-testing
217+
cassandra
218+
directory-server
219+
xmlgraphics-batik
220+
roller
221+
maven-artifact
222+
maven-doxia
223+
abdera
224+
maven
225+
commons-logging
226+
commons-cli
227+
servicemix4-nmr
228+
servicemix-archetypes
229+
servicemix4-bundles
230+
servicemix4-kernel
231+
servicemix4-features
232+
servicemix3
233+
servicemix-utils
234+
servicemix-maven-plugins
235+
servicemix4-specs
236+
geronimo-specs
237+
geronimo-xbean
238+
geronimo-yoko
239+
geronimo-javamail
240+
wink
241+
xmlbeans
242+
activemq-activeio
243+
pdfbox
244+
aries
245+
tuscany-sca-1.x
246+
tuscany-das
247+
tuscany-sdo
248+
tuscany-sca-2.x
249+
maven-2
250+
myfaces-scripting
251+
ace
252+
mina-sshd
253+
tomcat55
254+
karaf
255+
maven-surefire
256+
commons-validator
257+
webservices-commons-xmlschema
258+
myfaces-extcdi
259+
myfaces-extval
260+
xerces2-j
261+
servicemix-components
262+
geronimo-txmanager
263+
openwebbeans
264+
geronimo-devtools
265+
geronimo-jaspi
266+
bval
267+
clerezza
268+
incubator-kie-optaplanner
269+
incubator-kie-drools
270+
bookkeeper
271+
hcatalog
272+
ftpserver
273+
karaf-cellar
274+
sqoop
275+
kandula
276+
logging-flume
277+
sandesha
278+
rampart
279+
savan
280+
pivot
281+
giraph
282+
tomcat-maven-plugin
283+
oozie
284+
tomcat
285+
accumulo
286+
commons-fileupload
287+
httpasyncclient
288+
commons-compress
289+
archiva-sandbox
290+
kalumet
291+
maven-app-engine
292+
opennlp
293+
james-jspf
294+
james-mime4j
295+
chemistry-opencmis
296+
jackrabbit-oak
297+
archiva-redback-components
298+
tiles-request
299+
tiles-autotag
300+
dubbo
301+
james-postage
302+
james-jdkim
303+
james-jsieve
304+
odftoolkit
305+
royale-compiler
306+
drill
307+
directmemory-lightning
308+
cassandra-java-driver
309+
commons-net
310+
jena
311+
incubator-retired-hdt
312+
tomee
313+
openejb
314+
predictionio-sdk-java
315+
commons-configuration
316+
incubator-stormcrawler
317+
ode-jacob
318+
oltu
319+
deltaspike
320+
sis
321+
commons-beanutils
322+
commons-csv
323+
incubator-retired-provisionr
324+
incubator-tez
325+
logging-log4j2
326+
fluo
327+
commons-pool
328+
commons-dbcp
329+
commons-jcs
330+
commons-jelly
331+
commons-jexl
332+
commons-jxpath
333+
commons-ognl
334+
commons-proxy
335+
commons-functor
336+
commons-imaging
337+
commons-jci
338+
commons-chain
339+
commons-dbutils
340+
commons-digester
341+
commons-bcel
342+
commons-vfs
343+
metamodel
344+
manifoldcf-integration-solr-3.x
345+
manifoldcf-integration-solr-4.x
346+
incubator-sentry
347+
commons-weaver
348+
incubator-batchee
349+
velocity-engine
350+
velocity-tools
351+
uima-uimaj
352+
uima-addons
353+
uima-sandbox
354+
uima-uimafit
355+
incubator-retired-wave
356+
jclouds
357+
jackrabbit-filevault
358+
jackrabbit-ocm
359+
cxf
360+
curator
361+
cxf-build-utils
362+
cxf-dosgi
363+
cxf-fediz
364+
cxf-xjc-utils
365+
servicemix
366+
archiva-redback-core
367+
olingo-odata2
368+
olingo-odata4
369+
maven-indexer
370+
flex-blazeds
371+
gora
372+
pinot
373+
hbase
374+
portals-pluto
375+
ant-antlibs-compress
376+
ant-antlibs-dotnet
377+
ant-antlibs-props
378+
ant-antlibs-vss
379+
ant-ivyde
380+
phoenix
381+
parquet-java
382+
ant-easyant-tasks
383+
incubator-optiq-linq4j
384+
calcite
385+
activemq-openwire
386+
ddlutils
387+
johnzon
388+
qpid-jms
389+
commons-math
390+
karaf-decanter
391+
xmlgraphics-fop-pdf-images
392+
tomcat80
393+
commons-text
394+
incubator-retired-tamaya
395+
gobblin
396+
incubator-samoa
397+
incubator-taverna-commandline
398+
incubator-taverna-common-activities
399+
incubator-taverna-engine
400+
incubator-taverna-language
401+
incubator-taverna-osgi
402+
incubator-taverna-server
403+
incubator-taverna-workbench-common-activities
404+
incubator-taverna-workbench
405+
asterixdb
406+
servicemix-bundles
407+
servicemix-specs
408+
struts-annotations
409+
clerezza-rdf-core
410+
directory-kerby
411+
commons-rdf
412+
asterixdb-hyracks
413+
polygene-sandbox
414+
dubbo-rpc-jsonrpc
415+
activemq-artemis
416+
datasketches-hive
417+
datasketches-pig
418+
datasketches-java
419+
nifi-maven
420+
apex-core
421+
incubator-retired-wave-android
422+
fluo-recipes
423+
shardingsphere-elasticjob
424+
incubator-retired-horn
425+
directory-fortress-core
426+
directory-fortress-enmasse
427+
rya
428+
skywalking
429+
unomi
430+
brooklyn-library
431+
brooklyn-server
432+
aries-rsa
433+
nifi-minifi
434+
cordova-plugin-compat
435+
incubator-kie-benchmarks
436+
phoenix-omid
437+
karaf-boot
438+
incubator-taverna-plugin-gis
439+
incubator-retired-gossip
440+
phoenix-tephra
441+
pulsar
442+
twill
443+
commons-rng
444+
incubator-twill
445+
incubator-retired-tamaya-extensions
446+
incubator-retired-tamaya-sandbox
447+
usergrid-android
448+
usergrid-java
449+
asterixdb-bad
450+
maven-resolver
451+
incubator-hivemall
452+
opennlp-addons
453+
opennlp-sandbox
454+
commons-numbers
455+
accumulo-bsp
456+
accumulo-instamo-archetype
457+
accumulo-pig
458+
accumulo-wikisearch
459+
aries-jax-rs-whiteboard
460+
rocketmq
461+
accumulo-examples
462+
geode-examples
463+
cayenne-modeler
464+
logging-log4j-boot
465+
ratis
466+
activemq-cli-tools
467+
qpid-jms-amqp-0-x
468+
freemarker-online-tester
469+
activemq-nms-openwire-generator
470+
datasketches-memory
471+
struts-extras
472+
calcite-avatica
473+
aries-jpa
474+
servicecomb-java-chassis
475+
aries-containers
476+
httpcomponents-stylecheck
477+
geronimo-config
478+
metamodel-membrane
479+
seatunnel
480+
directory-ldap-api
481+
netbeans-html4j
482+
geronimo-safeguard
483+
jackrabbit-filevault-package-maven-plugin
484+
shardingsphere-example
485+
datasketches-vector
486+
pdfbox-jbig2
487+
sling-org-apache-sling-api
488+
sling-org-apache-sling-auth-core
489+
sling-org-apache-sling-auth-form
490+
sling-org-apache-sling-commons-classloader
491+
sling-org-apache-sling-commons-compiler
492+
sling-org-apache-sling-commons-contentdetection
493+
sling-org-apache-sling-commons-johnzon
494+
sling-org-apache-sling-commons-log
495+
sling-org-apache-sling-commons-logservice
496+
sling-org-apache-sling-commons-metrics
497+
sling-org-apache-sling-commons-metrics-rrd4j
498+
sling-org-apache-sling-commons-mime
499+
sling-org-apache-sling-commons-messaging-mail
500+
sling-org-apache-sling-commons-messaging
501+
sling-org-apache-sling-commons-osgi
502+
sling-org-apache-sling-commons-scheduler
503+
sling-org-apache-sling-commons-threaddump
504+
sling-org-apache-sling-commons-threads
505+
sling-org-apache-sling-engine
506+
sling-org-apache-sling-adapter
507+
sling-org-apache-sling-bundleresource-impl
508+
sling-org-apache-sling-caconfig-api
509+
sling-org-apache-sling-caconfig-impl
510+
sling-org-apache-sling-caconfig-integration-tests
511+
sling-org-apache-sling-caconfig-spi
512+
sling-org-apache-sling-event-dea
513+
sling-org-apache-sling-discovery-api
514+
sling-org-apache-sling-discovery-base
515+
sling-org-apache-sling-discovery-commons
516+
sling-org-apache-sling-discovery-impl
517+
sling-org-apache-sling-discovery-oak
518+
sling-org-apache-sling-discovery-standalone
519+
sling-org-apache-sling-discovery-support

resources/repositories/python_repos.txt

Lines changed: 0 additions & 1 deletion
Original file line numberDiff line numberDiff line change
@@ -18,4 +18,3 @@ pulsar
1818
nifi
1919
cassandra
2020
mahout
21-
polaris
Lines changed: 0 additions & 3 deletions
Original file line numberDiff line numberDiff line change
@@ -1,5 +1,2 @@
11
arrow
22
teaclave
3-
iceberg
4-
datafusion
5-
dubbo

src/mining/csv_export.py

Lines changed: 1 addition & 1 deletion
Original file line numberDiff line numberDiff line change
@@ -6,7 +6,7 @@
66
AUTHOR_CSV_PATH = os.path.join(file_utils.RESULTS_PATH, f"{AUTHOR_FILE_NAME}.csv")
77
REPO_CSV_PATH = os.path.join(file_utils.RESULTS_PATH, "repo_data.csv")
88

9-
REPO_HEADER = ["Repo Name", "Language", "Commit Count", "Test Before", "Test After", "Test During", "Duration (s)",
9+
REPO_HEADER = ["Repo Name", "Language", "Test Before", "Test After", "Test During", "Duration (s)",
1010
"Avg Before Commit Size", "Avg After Commit Size", "Avg During Commit Size", "Avg Commit Size"]
1111

1212
AUTHOR_HEADER = ["Author", "Test Before", "Test After", "Test During"]

0 commit comments

Comments
 (0)