Ubuntu committed on
Commit
a693952
1 Parent(s): a39d163

first commit

Browse files
ConstructBuilder/ConstructBuilder.egg-info/PKG-INFO ADDED
@@ -0,0 +1,10 @@
 
 
 
 
 
 
 
 
 
 
 
1
+ Metadata-Version: 1.0
2
+ Name: ConstructBuilder
3
+ Version: 0.0.0
4
+ Summary: UNKNOWN
5
+ Home-page: UNKNOWN
6
+ Author: UNKNOWN
7
+ Author-email: UNKNOWN
8
+ License: UNKNOWN
9
+ Description: UNKNOWN
10
+ Platform: UNKNOWN
ConstructBuilder/ConstructBuilder.egg-info/SOURCES.txt ADDED
@@ -0,0 +1,5 @@
 
 
 
 
 
 
1
+ setup.py
2
+ ConstructBuilder.egg-info/PKG-INFO
3
+ ConstructBuilder.egg-info/SOURCES.txt
4
+ ConstructBuilder.egg-info/dependency_links.txt
5
+ ConstructBuilder.egg-info/top_level.txt
ConstructBuilder/ConstructBuilder.egg-info/dependency_links.txt ADDED
@@ -0,0 +1 @@
 
 
1
+
ConstructBuilder/ConstructBuilder.egg-info/top_level.txt ADDED
@@ -0,0 +1 @@
 
 
1
+
ConstructBuilder/__init__.py ADDED
File without changes
ConstructBuilder/__pycache__/__init__.cpython-39.pyc ADDED
Binary file (153 Bytes). View file
 
ConstructBuilder/__pycache__/builder.cpython-39.pyc ADDED
Binary file (5.29 kB). View file
 
ConstructBuilder/builder.py ADDED
@@ -0,0 +1,94 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
# Sequence building blocks shared by run_N / run_C. All values are
# one-letter amino-acid strings that get concatenated into constructs.

# Reporter sequence inserted only when GFP constructs are requested
# (presumably GFP itself, going by the `gfp` flag that gates it -- confirm).
G = 'MVSKGEELFTGVVPILVELDGDVNGHKFSVSGEGEGDATYGKLTLKFICTTGKLPVPWPTLVTTLTYGVQCFSRYPDHMKQHDFFKSAMPEGYVQERTIFFKDDGNYKTRAEVKFEGDTLVNRIELKGIDFKEDGNILGHKLEYNYNSHNVYIMADKQKNGIKVNFKIRHNIEDGSVQLADHYQQNTPIGDGPVLLPDNHYLSTQSALSKDPNEKRDHMVLLEFVTAAGITLGMDELYK'
# Spacer placed next to G in the GFP constructs.
# NOTE(review): 'XXXXXXX' looks like a placeholder -- confirm the real linker.
L2 = 'XXXXXXX'
# Segment placed directly next to the target protein P in every construct
# (presumably a protease cleavage site -- confirm).
T = 'LEENLYFQS'
# Glycine/serine spacer placed next to the fusion tag.
L1 = 'GGSGGGSGGGSGGGS'
# Six-histidine stretch placed at the far end of every construct.
H = 'HHHHHH'

# Fusion / solubility / affinity tags, keyed by the name callers pass in
# `solu_tag`. Insertion order matters: it is the order used when "all" tags
# are requested. Each key appears exactly once (the original literal repeated
# 'MBP', 'SUMO' and 'Fh8' further down; Python keeps only the last value of a
# repeated key, so those repeats were dead entries).
soluTag = {
    'MBP': 'MKIKTGARILALSALTTMMFSASALAKIEEGKLVIWINGDKGYNGLAEVGKKFEKDTGIKVTVEHPDKLEEKFPQVAATGDGPDIIFWAHDRFGGYAQSGLLAEITPDKAFQDKLYPFTWDAVRYNGKLIAYPIAVEALSLIYNKDLLPNPPKTWEEIPALDKELKAKGKSALMFNLQEPYFTWPLIAADGGYAFKYENGKYDIKDVGVDNAGAKAGLTFLVDLIKNKHMNADTDYSIAEAAFNKGETAMTINGPWAWSNIDTSKVNYGVTVLPTFKGQPSKPFVGVLSAGINAASPNKELAKEFLENYLLTDEGLEAVNKDKPLGAVALKSYEEELAKDPRIAATMENAQKGEIMPNIPQMSAFWYAVRTAVINAASGRQTVDEALKDAQTRITK',
    'SUMO': 'MSDQEAKPSTEDLGDKKEGEYIKLKVIGQDSSEIHFKVKMTTHLKKLKESYCQRQGVPMNSLRFLFEGQRIADNHTPKELGMEEEDVIEVYQEQTGGHSTV',
    'Fh8': 'MPSVQEVEKLLHVLDRNGDGKVSAEELKAFADDSKCPLDSNKIKAFIKEHDKNKDGKLDLKELVSILSS',
    'GST': 'MKLFYKPGACSLASHITLRESGKDFTLVSVDLMKKRLENGDDYFAVNPKGQVPALLLDDGTLLTEGVAIMQYLADSVPDRQLLAPVNSISRYKTIEWLNYIATELHKGFTPLFRPDTPEEYKPTVRAQLEKKLQYVNEALKDEHWICGQRFTIADAYLFTVLRWAYAVKLNLEGLEHIAAFMQRMAERPEVQDALSAEGLK',
    'NusA': 'MNKEILAVVEAVSNEKALPREKIFEALESALATATKKKYEQEIDVRVQIDRKSGDFDTFRRWLVVDEVTQPTKEITLEAARYEDESLNLGDYVEDQIESVTFDRITTQTAKQVIVQKVREAERAMVVDQFREHEGEIITGVVKKVNRDNISLDLGNNAEAVILREDMLPRENFRPGDRVRGVLYSVRPEARGAQLFVTRSKPEMLIELFRIEVPEIGEEVIEIKAAARDPGSRAKIAVKTNDKRIDPVGACVGMRGARVQAVSTELGGERIDIVLWDDNPAQFVINAMAPADVASIVVDEDKHTMDIAVEAGNLAQAIGRNGQNVRLASQLSGWELNVMTDDLQAKHQAEAHAAIDTFTKYLDIDEDFATVLVEEGFSTLEELAYVPMKELLEIEGLDEPTVEALRERAKNALATIAQAQEESLGDNKPADDLLNLEGVDRDLAFKLAARGVCTLEDLAEQGIDDLADIEGLTDEKAGALIMAARNICWFGDEA',
    'Thioredoxin': 'SDKIIHLTDDSFDTDVLKADGAILVDFWAEWCGPCKMIAPILDEIADEYQGKLTVAKLNIDQNPGTAPKYGIRGIPTLLLFKNGEVAATKVGALSKGQLKEFLDANLA',
    'FLAG': 'DYKDDDDK',
    'S-tag': 'KETAAAKFERQHMDS',
    'CBP': 'KRRWKKNFIAVSAANRFKKISSSGAL',
    'STREPII': 'WSHPQFEK',
    'BAP': 'GLNDIFEAQKIEWHE',
    'NT11': 'VSEPHDYNYEK',
    'Tab2': 'VVSHFND',
    'Z-basic': 'VDNKFNKEQQNAFYEILHLPNLNEEQRNAFIQSLKDDPSQSANLLAEAKKLNDAQPK',
    'ProteinA': 'MKKKNIYSIRKLGVGIASVTLGTLLISGGVTPAANAAQHDEAQQNAFYQVLNMPNLNADQRNGFIQSLKDDPSQSANVLGEAQKLNDSQAPKADAQQNNFNKDQQSAFYEILNMPNLNEAQRNGFIQSLKDDPSQSTNVLGEAKKLNESQAPKADNNFNKEQQNAFYEILNMPNLNEEQRNGFIQSLKDDPSQSANLLSEAKKLNESQAPKADNKFNKEQQNAFYEILHLPNLNEEQRNGFIQSLKDDPSQSANLLAEAKKLNDAQAPKADNKFNKEQQNAFYEILHLPNLTEEQRNGFIQSLKDDPSVSKEILAEAKKLNDAQAPKEEDNNKPGKEDNNKPGKEDNNKPGKEDNNKPGKEDNNKPGKEDGNKPGKEDNKKPGKEDGNKPGKEDNKKPGKEDGNKPGKEDGNKPGKEDGNGVHVVKPGDTVNDIAKANGADKIAADNKLADKNMIKPGQELVVDKKQPANHADANKAQALPETGEENPFIGTTVFGGLSLALGAALLEL',
    'IMPACT': 'TNPGVSAWQVNTAYTAGQLVTYNGKTYKCLQPHTSLAGWEPSNVPALWQLQ',
    'mysB': 'MTMYATLEEAIDAAREEFLADNPGIDAEDANVQQFNAQKYVLQDGDIMWQVEFFADEGEEGECLPMLSGEAAQSVFDGDYDEIEIRQEWQEENTLHEWDEGEFQLEPPLDTEEGRAAADEWDER',
    'PolyR': 'RRRRR',
    'c-myc': 'EQKLISEEDL',
    'S': 'KETAAAKFERQHMDS',
    'SBP-tag': 'MDEKTTGWRGGHVVEGLAGELEQLRARLEHHPQGQREP',
    'Strep-tag': 'WRHPQFGG',
    'Twin-Strep-tag': 'SAWSHPQFEKGGGSGGGSGGSAWSHPQFEK',
    'HAT': 'KDHLIHNVHKEFHAHAHNK',
    'BCCP': 'MDIRKIKKLIELVEESGISELEISEGEESVRISRAAPAASFPVMQQAYAAPMMQQPAQSNAAAPATVPSMEAPAAAEISGHIVRSPMVGTFYRTPSPDAKAFIEVGQKVNVDTLCIVEAMKMMNQIEADKSGTVKAILVESGQPVEFDEPLVVIE',
    'HaloTag': 'SGSAEIGTGFPFDPHYVEVLGERMHYVDVGPRDGTPVLFLHGNPTSSYVWRNIIPHVAPTHRCIAPDLIGMGKSDKPDLGYFFDDHVRFMDAFIEALGLEEVVLVIHDWGSALGFHWAKRNPERVKGIAFMEFIRPIPTWDEWPEFARETFQAFRTTDVGRKLIIDQNVFIEGTLPCGVVRPLTEVEMDHYREPFLNPVDREPLWRFPNELPIAGEPANIVALVEEYMDWLHQSPVPKLLFWGTPGVLIPPAEAARLAKSLPNCKAVDIGPGLNLLQEDNPDLIGSEIARWLSTLEISG',
}
37
+
38
def run_N(P:str, gfp:bool, solu_tag:list)->dict:
    """Assemble the constructs that start with the target sequence ``P``.

    Every construct begins with ``P + T``. For each name in ``solu_tag`` the
    linker ``L1`` and the matching ``soluTag`` sequence follow, and the
    construct is closed by ``L2 + G + H`` when ``gfp`` is truthy or by ``H``
    alone otherwise. When ``solu_tag`` is empty a single tag-less construct
    (``P + T`` followed by the same closing part) is produced instead.

    Args:
        P: target sequence placed at the start of each construct.
        gfp: whether the ``L2 + G`` segment is included.
        solu_tag: iterable of ``soluTag`` keys.

    Returns:
        Dict mapping ``con_gfp_N[_<tag>]`` / ``con_N[_<tag>]`` to the
        assembled sequence, in the order the tags were given.

    Raises:
        KeyError: if a name in ``solu_tag`` is not a key of ``soluTag``.
    """
    label = "con_gfp_N" if gfp else "con_N"
    # Everything that comes after the (optional) fusion tag.
    tail = L2 + G + H if gfp else H

    constructs = {}
    for tag in solu_tag:
        fusion = soluTag[tag]
        constructs[f"{label}_{tag}"] = P + T + L1 + fusion + tail

    if not solu_tag:
        # TODO: verify the tag-less layout (no L1 linker is inserted here).
        constructs[label] = P + T + tail
    return constructs
53
+
54
def run_C(P:str, gfp:bool, solu_tag:list)->dict:
    """Assemble the constructs that end with the target sequence ``P``.

    Every construct opens with ``H`` (followed by ``G + L2`` when ``gfp`` is
    truthy) and ends with ``T + P``. For each name in ``solu_tag`` the
    matching ``soluTag`` sequence and the linker ``L1`` sit between those two
    parts. When ``solu_tag`` is empty a single tag-less construct is produced
    instead.

    Args:
        P: target sequence placed at the end of each construct.
        gfp: whether the ``G + L2`` segment is included.
        solu_tag: iterable of ``soluTag`` keys.

    Returns:
        Dict mapping ``con_gfp_C[_<tag>]`` / ``con_C[_<tag>]`` to the
        assembled sequence, in the order the tags were given.

    Raises:
        KeyError: if a name in ``solu_tag`` is not a key of ``soluTag``.
    """
    label = "con_gfp_C" if gfp else "con_C"
    # Everything that comes before the (optional) fusion tag.
    head = H + G + L2 if gfp else H

    constructs = {}
    for tag in solu_tag:
        fusion = soluTag[tag]
        constructs[f"{label}_{tag}"] = head + fusion + L1 + T + P

    if not solu_tag:
        # TODO: verify the tag-less layout (no L1 linker is inserted here).
        constructs[label] = head + T + P
    return constructs
69
+
70
def build(P:str, solu_tag:list, GFP:bool, P_pos:str)->dict:
    """
    Build the constructs for Protera's lab, taking into account:
        - orientation: N terminal, C terminal, or both
        - with/without GFP
        - fusion proteins (solubility tags)

    usage = build(amino_sequence, solutags, GFP:True/False, P_pos:"N+C","N","C")

    Available solutags:
    'MBP', 'SUMO', 'Fh8', 'GST', 'NusA', 'Thioredoxin', 'FLAG', 'S-tag', 'CBP', 'STREPII', 'BAP', 'NT11', 'Tab2', 'Z-basic', 'ProteinA', 'IMPACT', 'mysB', 'PolyR', 'c-myc', 'S', 'SBP-tag', 'Strep-tag', 'Twin-Strep-tag', 'HAT', 'BCCP', 'HaloTag'

    Args:
        P: amino-acid sequence of the target protein.
        solu_tag: tag names to fuse. If "all" is one of them, every tag in
            ``soluTag`` is used. ``None`` or an empty value means "no tag";
            a single tag name given as a plain string is accepted too.
        GFP: whether the GFP variants of the constructs are built.
        P_pos: orientation selector; N constructs are built when it contains
            "N", C constructs when it contains "C" (so "N+C" or "NC" builds
            both). If it contains neither, the result is empty.

    Returns:
        Dict mapping construct names to sequences, N constructs first and
        C constructs after them.

    Raises:
        KeyError: propagated from ``run_N`` / ``run_C`` when a tag name is
            not a key of ``soluTag``.
    """
    # Normalise the tag selection. Without this, None crashed on the "all"
    # membership test below, and a bare string was substring-matched against
    # "all" and then iterated character by character.
    if solu_tag is None:
        solu_tag = []
    elif isinstance(solu_tag, str):
        solu_tag = [solu_tag] if solu_tag else []

    if "all" in solu_tag:
        solu_tag = list(soluTag)

    c_constructs = run_C(P, GFP, solu_tag) if "C" in P_pos else {}
    n_constructs = run_N(P, GFP, solu_tag) if "N" in P_pos else {}

    # N-terminal entries come first in the merged result.
    return {**n_constructs, **c_constructs}
ConstructBuilder/setup.py ADDED
@@ -0,0 +1,2 @@
 
 
 
1
"""Minimal packaging script: registers the distribution name only."""
from setuptools import setup

setup(name="ConstructBuilder")
construct.py CHANGED
@@ -19,8 +19,8 @@ def LabFusion(name, file , uni_seq , orientation:str="NC", gfp:bool=False, sol_t
19
  dick[name] = build(uni_seq, sol_tag, gfp, orientation)
20
  table = pd.DataFrame.from_dict(dick)
21
 
22
- table.to_csv(f"/home/ubuntu/1TB_disk/constructos/gradio_projects/constructs_{name}.csv")
23
- return table, f"/home/ubuntu/1TB_disk/constructos/gradio_projects/constructs_{name}.csv"
24
 
25
 
26
  int_align = gr.Interface(fn=LabFusion,
 
19
  dick[name] = build(uni_seq, sol_tag, gfp, orientation)
20
  table = pd.DataFrame.from_dict(dick)
21
 
22
+ table.to_csv(f"./gradio_projects/constructs_{name}.csv")
23
+ return table, f"./gradio_projects/constructs_{name}.csv"
24
 
25
 
26
  int_align = gr.Interface(fn=LabFusion,