Skip to content

Commit 3105dce

Browse files
committed
fill-db: Allow loading only *combined*.ttl data files
1 parent f177374 commit 3105dce

File tree

1 file changed

+11
-1
lines changed

1 file changed

+11
-1
lines changed

run/fill-db

Lines changed: 11 additions & 1 deletion
Original file line numberDiff line numberDiff line change
@@ -35,6 +35,7 @@ batch_size="$BATCH_SIZE_DEFAULT"
3535
validate=false
3636
validate_only=false
3737
validation_output_file="$build_dir/ttl_validation_errors.txt"
38+
data_glob="*.ttl"
3839

3940
function print_help() {
4041

@@ -58,6 +59,9 @@ function print_help() {
5859
echo " The number of Turtle files to load into the DB at once [default: $BATCH_SIZE_DEFAULT]"
5960
echo " --offline"
6061
echo " Do not try to fetch git repos"
62+
echo " --combined-only"
63+
echo " Do not load all TTL files, only ones that have the string 'combined'"
64+
echo " in their file-name"
6165
echo " --experimental"
6266
echo " Uses the new experimental data source."
6367
echo " NOTE: This data is private, so you need to get access first"
@@ -107,6 +111,9 @@ do
107111
-o|--offline)
108112
online=false
109113
;;
114+
--combined-only)
115+
data_glob="*combined*.ttl"
116+
;;
110117
--experimental)
111118
data_url="$CLONE_URL_EXP_DATA"
112119
;;
@@ -255,9 +262,12 @@ echo
255262
echo "Assembling the list of RDF source files ..."
256263
find \
257264
"$ontology_ttls_root" \
258-
"$data_ttls_root" \
259265
-name "*.ttl" \
260266
> "$input_list_file"
267+
find \
268+
"$data_ttls_root" \
269+
-name "$data_glob" \
270+
>> "$input_list_file"
261271
num_inputs="$(cat "$input_list_file" | wc -l)"
262272
echo "# input files: $num_inputs"
263273

0 commit comments

Comments
 (0)