Spaces:

HUBioDataLab
/

ASCARIS

Sleeping

App Files Community

fatmacankara committed on Dec 12, 2023

Commit

5b00e58

1 Parent(s): a802398

Update code/alphafold_featureVector.py

Browse files

Files changed (1) hide show

code/alphafold_featureVector.py +18 -2

code/alphafold_featureVector.py CHANGED Viewed

@@ -347,12 +347,14 @@ def alphafold(input_set, mode, impute):
         ## Physicochemical properties
         print('Adding physicochemical properties...\n')
         data = add_physicochemical(data)
-        st.write('DOMAIN BAK')
         st.write(data)
         ## Domains
         print('Adding domains\n')
         data = add_domains(data, path_to_domains)
         ## Processing data frame
         data = data.astype(str)
@@ -372,6 +374,12 @@ def alphafold(input_set, mode, impute):
         ## canonical_fasta : Dataframe including canonical sequence for the protein of interest. Obtained from UniProt.
         ## isoform_fasta: Dataframe including isoform sequences for the protein of interest. Obtained from UniProt.
         not_match_in_uniprot, uniprot_matched, canonical_fasta, isoform_fasta = uniprotSequenceMatch(data)
         not_match_in_uniprot = not_match_in_uniprot.reset_index().drop(['index'], axis=1)
@@ -379,7 +387,10 @@ def alphafold(input_set, mode, impute):
             not_match_in_uniprot[key] = ''
         not_match_in_uniprot = not_match_in_uniprot.rename(columns=change_names)
         uniprot_matched = add_annotations(uniprot_matched)
-        st.write('uniprot_matched')
         st.write(uniprot_matched)
@@ -401,6 +412,9 @@ def alphafold(input_set, mode, impute):
                     uniprot_matched.at[w, q] = 'nan'
         uniprot_matched = uniprot_matched.rename(columns=change_names)
         uniprot_matched['wt_sequence_match'] = uniprot_matched['wt_sequence_match'].astype(str)
         ## Avoiding downloading files for SASA calculation if already downloaded.
@@ -444,6 +458,8 @@ def alphafold(input_set, mode, impute):
         uniprot_matched = uniprot_matched.replace({'nan': np.NaN})
         for annot in ['Domain', 'Alternative sequence', 'Chain', 'Sequence conflict', 'Compositional bias']:
             try:
                 uniprot_matched = uniprot_matched.drop(columns=annot)

         ## Physicochemical properties
         print('Adding physicochemical properties...\n')
         data = add_physicochemical(data)
+        st.write('add_physicochemical')
         st.write(data)
         ## Domains
         print('Adding domains\n')
         data = add_domains(data, path_to_domains)
+        st.write('add_domains')
+        st.write(data)
         ## Processing data frame
         data = data.astype(str)
         ## canonical_fasta : Dataframe including canonical sequence for the protein of interest. Obtained from UniProt.
         ## isoform_fasta: Dataframe including isoform sequences for the protein of interest. Obtained from UniProt.
         not_match_in_uniprot, uniprot_matched, canonical_fasta, isoform_fasta = uniprotSequenceMatch(data)
+        st.write('not_match_in_uniprot')
+        st.write(not_match_in_uniprot)
+        st.write('uniprot_matched')
+        st.write(uniprot_matched)
         not_match_in_uniprot = not_match_in_uniprot.reset_index().drop(['index'], axis=1)
             not_match_in_uniprot[key] = ''
         not_match_in_uniprot = not_match_in_uniprot.rename(columns=change_names)
         uniprot_matched = add_annotations(uniprot_matched)
+        st.write('not_match_in_uniprot col name changed')
+        st.write(not_match_in_uniprot)
+        st.write('uniprot_matched annotation added')
         st.write(uniprot_matched)
                     uniprot_matched.at[w, q] = 'nan'
         uniprot_matched = uniprot_matched.rename(columns=change_names)
         uniprot_matched['wt_sequence_match'] = uniprot_matched['wt_sequence_match'].astype(str)
+        st.write('burda ne oldu')
+        st.write(uniprot_matched)
         ## Avoiding downloading files for SASA calculation if already downloaded.
         uniprot_matched = uniprot_matched.replace({'nan': np.NaN})
+        st.write('isoform match vs ')
+        st.write(uniprot_matched)
         for annot in ['Domain', 'Alternative sequence', 'Chain', 'Sequence conflict', 'Compositional bias']:
             try:
                 uniprot_matched = uniprot_matched.drop(columns=annot)