Skip to content

Commit 0acab32

Browse files
committed
small fix for the bench
1 parent 35a83b0 commit 0acab32

7 files changed

Lines changed: 20 additions & 3 deletions

.gitignore

Lines changed: 6 additions & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -8,7 +8,9 @@ data/param_search
88
src/PROBESt/__pycache__
99
tests/PROBESt/__pycache__
1010
tests_outs/
11+
tests_out/
1112
test_outs/
13+
test_out/
1214
test_download/
1315
data/databases/open/probeBase_false_formatted.csv
1416
data/databases/open/probeBase_false_genome_results.csv
@@ -75,8 +77,12 @@ htmlcov/
7577
*.fna
7678
*.faa
7779
*.out
80+
*gz
81+
scripts/loop_generation/
7882
PROBEst.Rproj
7983
.Rproj.user
8084
.Rhistory
8185
articles.tar.bz2
8286
data/databases/articles/artificial_database_structure
87+
data/databases/articles/unvalidated.txt
88+
scripts/databases/combine_databases.py
Binary file not shown.
Binary file not shown.
Binary file not shown.
Binary file not shown.
Binary file not shown.

scripts/loop_generation/run_generation_loop.sh

Lines changed: 14 additions & 3 deletions
Original file line numberDiff line numberDiff line change
@@ -12,8 +12,8 @@ PROJECT_ROOT="$(cd "$SCRIPT_DIR/../.." && pwd)"
1212

1313
# Default directories
1414
GENOMES_DIR="$PROJECT_ROOT/test_out/all_genomes"
15-
BLASTDB_DIR="$PROJECT_ROOT/test_out/all_blastdb"
16-
OUTPUT_DIR="$PROJECT_ROOT/test_out/all_output"
15+
BLASTDB_DIR="$PROJECT_ROOT/test_out/all_blast"
16+
OUTPUT_DIR="$PROJECT_ROOT/test_out/all_output_fast"
1717
CONTIGS_DIR="$PROJECT_ROOT/test_out/modeling/contigs"
1818
cat $PROJECT_ROOT/test_out/modeling/contigs/* > $PROJECT_ROOT/test_out/fullcontig
1919
CONTIG_DIR="$PROJECT_ROOT/test_out/fullcontig"
@@ -110,8 +110,19 @@ for species_name in "${SPECIES_LIST[@]}"; do
110110
continue
111111
fi
112112

113+
# Randomly select only 3 false databases
114+
if [ ${#false_bases[@]} -gt 3 ]; then
115+
# Create a temporary array with shuffled indices
116+
indices=($(seq 0 $((${#false_bases[@]} - 1)) | shuf | head -n 3))
117+
selected_false_bases=()
118+
for idx in "${indices[@]}"; do
119+
selected_false_bases+=("${false_bases[$idx]}")
120+
done
121+
false_bases=("${selected_false_bases[@]}")
122+
fi
123+
113124
echo "True base: $species_blastdb"
114-
echo "False bases: ${#false_bases[@]} databases"
125+
echo "False bases: ${#false_bases[@]} databases (randomly selected from available)"
115126
echo "Input FASTA: $species_genomes_dir"
116127
echo "Output: $species_output_dir"
117128
echo ""

0 commit comments

Comments
 (0)