# Provenance (from the original patch header):
#   Commit:  fafb342fe7e756c7a23b9d371565f089afdf18bd
#   Author:  Lan Hui
#   Date:    Tue, 28 Oct 2025 16:14:13 +0800
#   Subject: Map experiment ID to library strategy and library source
#   File:    Code/make_experiment_library_info_file.py (new file, index 0000000..9578945)
#   Patch footer: cgit v1.2.1
#
# Usage: python3 make_experiment_library_info_file.py
#
# Purpose: build a file (see EXPERIMENT_LIBRARY_INFO_FILE) that tells whether an experiment is RNA-seq.
#          Each output line holds three tab-separated fields:
#          experiment ID, library strategy, library source.
#
# 2025-10-28, hui

from configure import EXPERIMENT_LIBRARY_INFO_FILE, EXPERIMENT_INFO_DIR
from parse_ena_xml import parse_experiment
import glob, os

# Collect one [experiment_id, library_strategy, library_source] row per file
# found directly under EXPERIMENT_INFO_DIR.  Files are visited in sorted order
# so the output order is deterministic.
result = []
for fname in sorted(glob.glob(os.path.join(EXPERIMENT_INFO_DIR, '*'))):
    # The file's base name is used as the experiment ID, and also as the key
    # into the dictionary returned by parse_experiment().
    experiment_id = os.path.basename(fname)
    info = parse_experiment(fname)[experiment_id]
    result.append([experiment_id, info['library_strategy'], info['library_source']])

# Render every line BEFORE opening the output file.  If a field is not a
# string, the join raises here, while the output file is still untouched,
# instead of leaving a partially appended file behind.
lines = ['\t'.join(row) + '\n' for row in result]

print(f'Saving to {EXPERIMENT_LIBRARY_INFO_FILE}')
# NOTE(review): the file is opened in append mode, so running this script
# twice duplicates every row.  Confirm whether appending is intentional;
# if the file is meant to be rebuilt from scratch, 'w' would be the right mode.
with open(EXPERIMENT_LIBRARY_INFO_FILE, 'a') as f:
    f.writelines(lines)
print('Done. Saved %d lines.' % (len(result)))