Spaces:

NiniCat
/

CRISPRTool

Running

App Files Community

supercat666 committed on Feb 14

Commit

8a56ec1

•

1 Parent(s): 200a03c

generate .bed file

Browse files

Files changed (2) hide show

app.py +21 -3
cas9on.py +11 -0

app.py CHANGED Viewed

@@ -84,6 +84,7 @@ def initiate_run():
         elif len(transcripts) > 0:
             st.session_state.transcripts = transcripts
 # Check if the selected model is Cas9
 if selected_model == 'Cas9':
     # Use a radio button to select enzymes, making sure only one can be selected at a time
@@ -97,6 +98,20 @@ if selected_model == 'Cas9':
         # Gene symbol entry
         gene_symbol = st.text_input('Enter a Gene Symbol:', key='gene_symbol')
         # Prediction button
         predict_button = st.button('Predict on-target')
@@ -113,6 +128,8 @@ if selected_model == 'Cas9':
                 if gene_sequence:  # Ensure gene_sequence is not empty
                     genbank_file_path = f"{gene_symbol}_crispr_targets.gb"
                     cas9on.generate_genbank_file_from_df(df, gene_sequence, gene_symbol, genbank_file_path)
                     st.write('Top on-target predictions:')
                     st.dataframe(df)
@@ -124,6 +141,10 @@ if selected_model == 'Cas9':
                             file_name=genbank_file_path,
                             mime="text/x-genbank"
                         )
                     # Visualize the GenBank file using pyGenomeViz
                     gv = GenomeViz(
@@ -145,9 +166,6 @@ if selected_model == 'Cas9':
                     fig = gv.plotfig()
                     st.pyplot(fig)
-                    # Clean up the GenBank file after visualization
-                    os.remove(genbank_file_path)
     elif target_selection == 'off-target':
         ENTRY_METHODS = dict(
             manual='Manual entry of target sequence',

         elif len(transcripts) > 0:
             st.session_state.transcripts = transcripts
 # Check if the selected model is Cas9
 if selected_model == 'Cas9':
     # Use a radio button to select enzymes, making sure only one can be selected at a time
         # Gene symbol entry
         gene_symbol = st.text_input('Enter a Gene Symbol:', key='gene_symbol')
+        if 'current_gene_symbol' not in st.session_state:
+            st.session_state['current_gene_symbol'] = ""
+        # Function to clean up old files
+        def clean_up_old_files(gene_symbol):
+            genbank_file_path = f"{gene_symbol}_crispr_targets.gb"
+            bed_file_path = f"{gene_symbol}_crispr_targets.bed"
+            if os.path.exists(genbank_file_path):
+                os.remove(genbank_file_path)
+            if os.path.exists(bed_file_path):
+                os.remove(bed_file_path)
+        if st.session_state['current_gene_symbol'] and gene_symbol != st.session_state['current_gene_symbol']:
+            clean_up_old_files(st.session_state['current_gene_symbol'])
         # Prediction button
         predict_button = st.button('Predict on-target')
                 if gene_sequence:  # Ensure gene_sequence is not empty
                     genbank_file_path = f"{gene_symbol}_crispr_targets.gb"
                     cas9on.generate_genbank_file_from_df(df, gene_sequence, gene_symbol, genbank_file_path)
+                    bed_file_path = f"{gene_symbol}_crispr_targets.bed"
+                    cas9on.create_bed_file_from_df(df, bed_file_path)
                     st.write('Top on-target predictions:')
                     st.dataframe(df)
                             file_name=genbank_file_path,
                             mime="text/x-genbank"
                         )
+                    # Download button for the BED file
+                    with open(bed_file_path, "rb") as file:
+                        st.download_button(label="Download BED File", data=file,
+                            file_name=bed_file_path, mime="text/plain")
                     # Visualize the GenBank file using pyGenomeViz
                     gv = GenomeViz(
                     fig = gv.plotfig()
                     st.pyplot(fig)
     elif target_selection == 'off-target':
         ENTRY_METHODS = dict(
             manual='Manual entry of target sequence',

cas9on.py CHANGED Viewed

@@ -155,3 +155,14 @@ def generate_genbank_file_from_df(df, gene_sequence, gene_symbol, output_path):
     record.annotations["molecule_type"] = "DNA"
     SeqIO.write(record, output_path, "genbank")

     record.annotations["molecule_type"] = "DNA"
     SeqIO.write(record, output_path, "genbank")
def create_bed_file_from_df(df, output_path):
    """Write one BED-style line per row of *df* to *output_path*.

    Every line holds six tab-separated fields, in this order: ``Gene ID``,
    ``Start Pos``, ``End Pos``, ``gRNA``, ``Prediction`` and a strand symbol
    (``+`` or ``-``). Positions are truncated to ``int``; the prediction is
    written with its default string formatting.

    All lines are built before the file is opened, so a malformed row raises
    without leaving a truncated file behind.

    Args:
        df: pandas DataFrame providing the columns ``Gene ID``, ``Start Pos``,
            ``End Pos``, ``Strand``, ``gRNA`` and ``Prediction``.
        output_path: Destination path; an existing file is overwritten.

    Raises:
        KeyError: If a required column is missing (and *df* has rows).
        ValueError: If a position, or a strand that is not already ``+`` /
            ``-``, cannot be converted to ``int``.
    """
    # NOTE(review): the BED specification expects a 0-based start and an
    # integer score in 0-1000; values are passed through unchanged here --
    # confirm what downstream consumers of this file require.

    def _strand_symbol(value):
        # Tolerate a strand that is already symbolic; otherwise any value
        # greater than zero maps to "+", everything else to "-".
        if isinstance(value, str) and value.strip() in ("+", "-"):
            return value.strip()
        return "+" if int(value) > 0 else "-"

    bed_lines = []
    for _, row in df.iterrows():
        fields = (
            row["Gene ID"],
            int(row["Start Pos"]),
            int(row["End Pos"]),
            row["gRNA"],
            row["Prediction"],
            _strand_symbol(row["Strand"]),
        )
        bed_lines.append("\t".join(f"{field}" for field in fields) + "\n")

    # Fixed encoding and newline keep the output identical across platforms.
    with open(output_path, "w", encoding="utf-8", newline="\n") as bed_file:
        bed_file.writelines(bed_lines)