Skip to content

Commit

Permalink
Update the data collection script to process SV-only eQTLs
Browse files Browse the repository at this point in the history
  • Loading branch information
Ramanandan committed Aug 29, 2024
1 parent ce7e2b6 commit 547d9bc
Show file tree
Hide file tree
Showing 2 changed files with 8,402 additions and 7 deletions.
22 changes: 15 additions & 7 deletions data_collection.py
Original file line number Diff line number Diff line change
Expand Up @@ -2,17 +2,25 @@
# NOTE(review): this span appears to be a rendered diff hunk (-2,17 +2,25) with
# the +/- markers stripped, so pre-commit and post-commit lines are interleaved.
# Lines that look like the pre-commit version are flagged below — confirm
# against the repository before running this text as a script.
import argparse

# Set up argument parser
# NOTE(review): two consecutive assignments to `parser`; the second replaces
# the first, so only the 'Process SV and eQTL files.' description takes effect.
# The first looks like the pre-commit line — TODO confirm.
parser = argparse.ArgumentParser(description='Process a VCF file.')
parser = argparse.ArgumentParser(description='Process SV and eQTL files.')

# Add argument for file
# NOTE(review): presumably the pre-commit single-file option. As written it is
# still registered with required=True, so parse_args() would reject a command
# line that omits -f/--file — verify whether it should remain.
parser.add_argument('-f', '--file', type=str, required=True, help='Path to the VCF file (e.g., supporting_variants_for_nstd186.csv.gz)')
# Add arguments for files
# argparse exposes '--sv-file' as args.sv_file and '--eqtl-file' as
# args.eqtl_file (dashes in the long option become underscores).
parser.add_argument('-s', '--sv-file', type=str, required=True, help='Path to the SV CSV file (e.g., sv_data.csv.gz)')
parser.add_argument('-e', '--eqtl-file', type=str, required=True, help='Path to the eQTL file (e.g., eqtl_table.csv)')

# Parse arguments
# Reads sys.argv; exits with a usage error if a required option is missing.
args = parser.parse_args()

# Load the data from the specified file
# NOTE(review): `pd` is not bound in the visible span — presumably
# `import pandas as pd` sits on file line 1, just above this hunk; confirm.
# This load of args.file looks like the pre-commit line — TODO confirm.
vcf_data = pd.read_csv(args.file)
# Load the SV data from the specified file
sv_data = pd.read_csv(args.sv_file)

# Display the first few rows of the data
# NOTE(review): looks like the pre-commit preview of `vcf_data` — TODO confirm.
print(vcf_data.head())
# Load the eQTL data from the specified file
eqtl_data = pd.read_csv(args.eqtl_file)

# Display the first few rows of each dataframe to confirm
print("SV Data:")
print(sv_data.head())

print("\neQTL Data:")
print(eqtl_data.head())

Loading

0 comments on commit 547d9bc

Please sign in to comment.