Skip to content
Open
Show file tree
Hide file tree
Changes from all commits
Commits
Show all changes
42 commits
Select commit Hold shift + click to select a range
f1bcd02
Add -N option to wget of genome-fetcher.py
Lucioric2000 May 17, 2019
b43a194
Add the -N option to wget in the Java code
Lucioric2000 May 17, 2019
47f4cbe
Added a check for existence at the destination for files being downloaded
May 17, 2019
d3ee25e
Fix style, and add MongoDB installer
May 17, 2019
0930039
Added file size comparison to the intelligent re-download avoider
May 18, 2019
e07e140
Fixed some typos
May 18, 2019
4a18aa7
Fixed other typos
May 18, 2019
76def55
Fix typos (3)
May 18, 2019
56afa9d
Fix style typo (4)
May 18, 2019
0616742
Add references previously missed to import
May 18, 2019
5b9982e
Modify pom.xml to include Apache Commons Net
May 18, 2019
f953036
Modify pom.xml
May 18, 2019
b4ebf85
Cmt
May 18, 2019
7ea7a64
Cmt
May 18, 2019
67b0fec
Cmt
May 18, 2019
8cc94e0
Java code stable
May 18, 2019
ba6e5e8
Cmt
Lucioric2000 Jul 19, 2020
f2a5d1f
Merge remote-tracking branch 'origin/master' into HEAD
Lucioric2000 Jul 19, 2020
0b5f9be
Commit
Lucioric2000 Sep 15, 2020
85c0f46
Merge branch 'master' of https://github.com/opencb/cellbase
Lucioric2000 Oct 19, 2020
6d12699
Merge branch 'master' of https://github.com/Lucioric2000/cellbase
Lucioric2000 Oct 19, 2020
136a7a4
Commit
Lucioric2000 Oct 19, 2020
85d02c8
Commit
Lucioric2000 Oct 21, 2020
f874cca
Commit
Lucioric2000 Oct 21, 2020
a695c34
Merge branch 'new-branch-name'
Lucioric2000 Oct 21, 2020
1f8f4a3
Commit
Lucioric2000 Oct 21, 2020
df637c7
Merge branch 'master' of https://github.com/Lucioric2000/cellbase
Lucioric2000 Oct 21, 2020
653dc78
Commit
Lucioric2000 Oct 21, 2020
52938f0
Commit
Lucioric2000 Oct 21, 2020
b7f3736
Merge branch 'master' of https://github.com/Lucioric2000/cellbase
Lucioric2000 Oct 21, 2020
ae5b091
Commit
Lucioric2000 Oct 21, 2020
ba50615
Commit
Lucioric2000 Oct 21, 2020
35c7f83
Commit
Lucioric2000 Oct 21, 2020
d4a2065
Commit
Lucioric2000 Oct 21, 2020
e5ac9c1
Merge branch 'master' of https://github.com/Lucioric2000/cellbase
Lucioric2000 Oct 21, 2020
8348d64
Commit
Lucioric2000 May 2, 2021
560b2ba
Commit
Lucioric2000 May 2, 2021
db38b11
Merge branch 'master' of https://github.com/Lucioric2000/cellbase
Lucioric2000 May 2, 2021
0d9f80b
Commit
Lucioric2000 May 2, 2021
1a3a13e
Commit
Lucioric2000 May 2, 2021
f5c7e28
Commit
Lucioric2000 May 2, 2021
23b468b
Commit
Lucioric2000 May 7, 2021
File filter

Filter by extension

Filter by extension


Conversations
Failed to load comments.
Loading
Jump to
The table of contents is too big for display.
Diff view
Diff view
  •  
  •  
  •  
Empty file modified .gitignore
100644 → 100755
Empty file.
2 changes: 1 addition & 1 deletion .gitmodules
100644 → 100755
Original file line number Diff line number Diff line change
@@ -1,3 +1,3 @@
[submodule "cellbase-web/lib/jsorolla"]
path = cellbase-web/lib/jsorolla
url = https://github.com/opencb/jsorolla.git
url = https://github.com/Lucioric2000/jsorolla.git
Empty file modified LICENSE
100644 → 100755
Empty file.
Empty file modified README.md
100644 → 100755
Empty file.
Empty file modified cellbase-app/app/bin/obsolete/gene-chunkIds.js
100644 → 100755
Empty file.
Empty file modified cellbase-app/app/bin/obsolete/genome-fetcher/CHECKSUMS
100644 → 100755
Empty file.
10 changes: 5 additions & 5 deletions cellbase-app/app/bin/obsolete/genome-fetcher/genome-fetcher.py
Original file line number Diff line number Diff line change
Expand Up @@ -101,15 +101,15 @@
logging.debug(sp_obj['assembly'])
outfile = sequence_folder+"/"+sp_short.capitalize() + ".{0}".format(sp_obj['assembly'])+".fa.gz"
logging.debug(outfile)
command = "wget --tries=10 " + url_seq +" -O '"+outfile+"' -o "+outfile+".log"
command = "wget -N --tries=10 " + url_seq +" -O '"+outfile+"' -o "+outfile+".log"
logging.debug(command)
os.system(command)
cmd = "./genome_info.pl --species '{0}' -o {1}/genome_info.json".format(sp, sequence_folder)
logging.debug(cmd)
os.system(cmd)
# for i in sp_obj['chromosomes']:
# outfile = seq_folder+"/chrom_"+i+".fa.gz"
# command = "wget --tries=10 " + url_seq+"/*.dna.chromosome."+i+".fa.gz -O '"+outfile+"' -o "+outfile+".log"
# command = "wget -N --tries=10 " + url_seq+"/*.dna.chromosome."+i+".fa.gz -O '"+outfile+"' -o "+outfile+".log"
# logging.debug(command)
# os.system(command)

Expand All @@ -121,7 +121,7 @@
url_gtf = sp_obj['sequence_url'].replace("fasta", "gtf")+"{0}".format(sp_short)
logging.debug(url_gtf)
outfile = gene_folder+"/"+sp_short+".gtf.gz"
command = "wget --tries=10 " + url_gtf+"/*.gtf.gz -O '"+outfile+"' -o "+outfile+".log"
command = "wget -N --tries=10 " + url_gtf+"/*.gtf.gz -O '"+outfile+"' -o "+outfile+".log"
logging.debug(command)
os.system(command)
if sp_obj['phylo'] is not 'Bacteria':
Expand Down Expand Up @@ -159,7 +159,7 @@
variation_url = sp_obj['variation_url']
for file in variation_files:
outfile = variation_folder+"/"+file
command = "wget --tries=10 " + variation_url+"/"+file+" -O '"+outfile+"' -o "+outfile+".log"
command = "wget -N --tries=10 " + variation_url+"/"+file+" -O '"+outfile+"' -o "+outfile+".log"
logging.debug(command)
os.system(command)

Expand All @@ -172,7 +172,7 @@
regulation_url = sp_obj['regulation_url']+sp_short
for file in regulation_files:
outfile = regulation_folder+"/"+file
command = "wget --tries=10 " + regulation_url+"/"+file+" -O '"+outfile+"' -o "+outfile+".log"
command = "wget -N --tries=10 " + regulation_url+"/"+file+" -O '"+outfile+"' -o "+outfile+".log"
logging.debug(command)
os.system(command)

Expand Down
Empty file modified cellbase-app/app/bin/obsolete/genome-fetcher/species.json
100644 → 100755
Empty file.
Empty file modified cellbase-app/app/bin/obsolete/genome-fetcher/species_info.json
100644 → 100755
Empty file.
Empty file modified cellbase-app/app/bin/obsolete/genome-fetcher/species_info.txt
100644 → 100755
Empty file.
Empty file modified cellbase-app/app/bin/obsolete/variation-chunkIds.js
100644 → 100755
Empty file.
Empty file modified cellbase-app/app/example/5000_variants.vcf.gz
100644 → 100755
Empty file.
Empty file modified cellbase-app/app/example/BasicTest.Json
100644 → 100755
Empty file.
Empty file modified cellbase-app/app/example/BasicTest.gvf
100644 → 100755
Empty file.
Empty file modified cellbase-app/app/example/Escherichia coli.owl
100644 → 100755
Empty file.
Empty file.
Empty file.
Empty file modified cellbase-app/app/mongodb-scripts/add_database_roles_mongo.js
100644 → 100755
Empty file.
Empty file modified cellbase-app/app/mongodb-scripts/clinical-indexes.js
100644 → 100755
Empty file.
Empty file modified cellbase-app/app/mongodb-scripts/clinical-legacy-indexes.js
100644 → 100755
Empty file.
Empty file modified cellbase-app/app/mongodb-scripts/conservation-indexes.js
100644 → 100755
Empty file.
Empty file modified cellbase-app/app/mongodb-scripts/create-biouser.js
100644 → 100755
Empty file.
Empty file modified cellbase-app/app/mongodb-scripts/drugbank-indexes.js
100644 → 100755
Empty file.
Empty file modified cellbase-app/app/mongodb-scripts/gene-indexes.js
100644 → 100755
Empty file.
Empty file modified cellbase-app/app/mongodb-scripts/genome_sequence-indexes.js
100644 → 100755
Empty file.
Empty file modified cellbase-app/app/mongodb-scripts/grant-users.js
100644 → 100755
Empty file.
Empty file modified cellbase-app/app/mongodb-scripts/mutation-indexes.js
100644 → 100755
Empty file.
Empty file modified cellbase-app/app/mongodb-scripts/protein-indexes.js
100644 → 100755
Empty file.
Empty file.
Empty file.
Empty file modified cellbase-app/app/mongodb-scripts/regulatory_region-indexes.js
100644 → 100755
Empty file.
Empty file modified cellbase-app/app/mongodb-scripts/repeat-indexes.js
100644 → 100755
Empty file.
Empty file modified cellbase-app/app/mongodb-scripts/variation-indexes.js
100644 → 100755
Empty file.
Empty file.
Empty file modified cellbase-app/app/mongodb-scripts/variation_phenotype-indexes.js
100644 → 100755
Empty file.
Empty file.
5 changes: 5 additions & 0 deletions cellbase-app/pom.xml
100644 → 100755
Original file line number Diff line number Diff line change
Expand Up @@ -47,6 +47,11 @@
<artifactId>commons-io</artifactId>
<version>2.4</version>
</dependency>
<dependency>
<groupId>commons-net</groupId>
<artifactId>commons-net</artifactId>
<version>${commons-net.version}</version>
</dependency>
<dependency>
<groupId>org.spockframework</groupId>
<artifactId>spock-core</artifactId>
Expand Down
Empty file.
Empty file.
Empty file.
Empty file.
21 changes: 21 additions & 0 deletions cellbase-app/src/main/java/org/opencb/cellbase/app/cli/DownloadCommandExecutor.java
100644 → 100755
Original file line number Diff line number Diff line change
Expand Up @@ -24,6 +24,8 @@
import org.apache.commons.collections.map.HashedMap;
import org.apache.commons.io.FilenameUtils;
import org.apache.commons.io.IOUtils;
import org.apache.commons.net.ftp.FTPClient;
import org.apache.commons.net.ftp.FTPFile;
import org.apache.commons.lang.StringUtils;
import org.opencb.cellbase.core.config.Species;
import org.opencb.commons.utils.FileUtils;
Expand Down Expand Up @@ -1165,6 +1167,25 @@ private void downloadFile(String url, String outputFileName) throws IOException,
private void downloadFile(String url, String outputFileName, List<String> wgetAdditionalArgs)
throws IOException, InterruptedException {

File file = new File(outputFileName);
if (file.exists()) {
FTPClient ftpClient = new FTPClient();
// code to connect and login....

FTPFile remotefile = ftpClient.mlistFile(outputFileName);
long remotesize = remotefile.getSize();
long localsize = file.length();
long locallastmodified = file.lastModified();
logger.info("File " + outputFileName + " exists, with size " + localsize + " vs "
+ remotesize + " in remote and will not be downloaded again");
if (remotesize == localsize) {
logger.info("Download avoided because the files have the same size");
return;
}
//If the filestamps differ, regardless of the timestamps downloads the file
Calendar remotets = remotefile.getTimestamp();
logger.info("local ts " + locallastmodified + "wheras remote ts is " + remotets.toString());
}
List<String> wgetArgs = new ArrayList<>(Arrays.asList("--tries=10", url, "-O", outputFileName, "-o",
outputFileName + ".log"));
if (wgetAdditionalArgs != null && !wgetAdditionalArgs.isEmpty()) {
Expand Down
Empty file.
Empty file.
Empty file.
Empty file.
Empty file.
Empty file.
Empty file.
Empty file.
Empty file.
Empty file.
Empty file.
Empty file.
Empty file.
Empty file.
Empty file.
Empty file.
Empty file.
Empty file.
Empty file.
Empty file.
Empty file.
Empty file.
Empty file.
Empty file.
Empty file.
Empty file.
Empty file.
Empty file.
Empty file.
Empty file.
Empty file.
Empty file.
Empty file.
Empty file.
Empty file.
Empty file.
Empty file.
Empty file.
Empty file.
Empty file.
Empty file.
Empty file.
Empty file.
Empty file.
Empty file.
Original file line number Diff line number Diff line change
Expand Up @@ -30,7 +30,7 @@ public class DOCMIndexer extends ClinicalIndexer {
private static final String DISEASE = "disease";
private static final String SOURCE_PUBMED_ID = "source_pubmed_id";
private static final String PMID = "PMID:";
private static final String URL_PREFIX = "http://docm.genome.wustl.edu/variants/";
private static final String URL_PREFIX = "http://docm.info/variants/";
private static final String HGVS = "hgvs";
private static final String GENE = "gene";
private static final String TRANSCRIPT = "transcript";
Expand Down
Empty file.
Empty file.
Empty file.
Empty file.
Empty file.
Empty file.
Empty file.
Empty file.
Empty file.
Empty file.
Empty file.
Empty file.
Empty file.
Empty file.
Empty file.
Empty file.
Empty file.
Empty file.
Empty file.
Empty file.
Empty file.
Empty file.
Empty file.
Empty file.
Empty file.
Empty file.
Empty file.
Empty file.
Empty file.
Empty file.
Empty file.
Empty file modified cellbase-app/src/test/resources/caddTest.tsv.gz
100644 → 100755
Empty file.
Empty file modified cellbase-app/src/test/resources/caddTest.tsv.gz.tbi
100644 → 100755
Empty file.
Empty file modified cellbase-app/src/test/resources/cadd_example.txt.gz
100644 → 100755
Empty file.
Empty file modified cellbase-app/src/test/resources/clinvarExample.xml
100644 → 100755
Empty file.
Empty file.
Empty file.
Empty file modified cellbase-app/src/test/resources/cosmicTest.csv
100644 → 100755
Empty file.
Empty file modified cellbase-app/src/test/resources/dbSnpTest.gz
100644 → 100755
Empty file.
Empty file modified cellbase-app/src/test/resources/dbSnpTest.gz.tbi
100644 → 100755
Empty file.
Empty file modified cellbase-app/src/test/resources/dgv.json.gz
100644 → 100755
Empty file.
Empty file modified cellbase-app/src/test/resources/dgv.txt.gz
100644 → 100755
Empty file.
Empty file modified cellbase-app/src/test/resources/disGeNetTest.csv
100644 → 100755
Empty file.
Empty file.
Empty file modified cellbase-app/src/test/resources/ebolaGenome/Ebola_virus.gtf.gz
100644 → 100755
Empty file.
Empty file modified cellbase-app/src/test/resources/entrezIdToEnsemblIdTest.csv
100644 → 100755
Empty file.
Empty file.
Empty file modified cellbase-app/src/test/resources/geneParser/MotifFeatures.gff.gz
100644 → 100755
Empty file.
Empty file modified cellbase-app/src/test/resources/geneParser/homo_sapiens.gtf
100644 → 100755
Empty file.
Empty file modified cellbase-app/src/test/resources/geneParser/tfbs.txt
100644 → 100755
Empty file.
Empty file modified cellbase-app/src/test/resources/gwasTest.csv
100644 → 100755
Empty file.
Empty file.
Empty file modified cellbase-app/src/test/resources/regulation/motiffeatures.gff.gz
100644 → 100755
Empty file.
Empty file modified cellbase-app/src/test/resources/repeats/genomicSuperDups.txt.gz
100644 → 100755
Empty file.
Empty file modified cellbase-app/src/test/resources/repeats/repeats.test.json.gz
100644 → 100755
Empty file.
Empty file modified cellbase-app/src/test/resources/repeats/simpleRepeat.txt.gz
100644 → 100755
Empty file.
Empty file modified cellbase-app/src/test/resources/repeats/windowMasker.txt.gz
100644 → 100755
Empty file.
Empty file.
Empty file.
Empty file.
Empty file.
Empty file.
Empty file.
Empty file.
Empty file.
Empty file.
Empty file.
Empty file.
Empty file.
Empty file.
Empty file.
Empty file.
Empty file.
Empty file.
Empty file.
Empty file.
Empty file.
Empty file.
Empty file modified cellbase-app/src/test/resources/variationParser/source.txt.gz
100644 → 100755
Empty file.
Empty file.
Empty file.
Empty file.
Empty file.
Empty file modified cellbase-app/src/test/resources/vep-example-output.txt
100644 → 100755
Empty file.
Empty file modified cellbase-client/pom.xml
100644 → 100755
Empty file.
Empty file.
Empty file.
Empty file.
Empty file.
Empty file.
Empty file.
Empty file.
Empty file.
Empty file.
Empty file.
Empty file.
Empty file.
Empty file.
Empty file.
Empty file.
Empty file.
Empty file.
Empty file.
Empty file.
Empty file.
Empty file.
Empty file.
Empty file.
Empty file.
Empty file.
Empty file.
Empty file modified cellbase-client/src/main/resources/client-configuration.yml
100644 → 100755
Empty file.
Empty file.
Empty file.
Empty file.
Empty file.
Empty file.
Empty file.
Empty file.
Empty file.
Empty file.
Empty file.
Empty file.
Empty file.
Empty file.
Empty file modified cellbase-core/pom.xml
100644 → 100755
Empty file.
Empty file.
Empty file.
Empty file.
Empty file.
Empty file.
Empty file.
Empty file.
Empty file.
Empty file.
Empty file.
Empty file.
Empty file.
Empty file.
Empty file.
Empty file.
Empty file.
Empty file.
Empty file.
Empty file.
Empty file.
Empty file.
Empty file.
Empty file.
Empty file.
Empty file.
Empty file.
Empty file.
Empty file.
Empty file.
Empty file.
Empty file.
Empty file.
Empty file.
Empty file.
Empty file.
Empty file.
Empty file.
Empty file.
Empty file.
Empty file.
Empty file.
Empty file.
Empty file.
Empty file.
Empty file.
Empty file.
Empty file.
Empty file.
Empty file.
Empty file.
Empty file.
Empty file.
Empty file.
Empty file.
Empty file.
Empty file.
Empty file.
Empty file.
Empty file.
Empty file.
Empty file.
Empty file.
Empty file.
Empty file.
Empty file.
Empty file.
Empty file.
Empty file.
Empty file.
Empty file.
Empty file.
Empty file.
Empty file.
Empty file.
Empty file.
Empty file.
Empty file.
Empty file.
Empty file.
Empty file.
Empty file.
Empty file.
Empty file.
Empty file.
Empty file.
Empty file.
Loading