Spaces:
Running
Running
Ubuntu
commited on
Commit
•
a693952
1
Parent(s):
a39d163
first commit
Browse files- ConstructBuilder/ConstructBuilder.egg-info/PKG-INFO +10 -0
- ConstructBuilder/ConstructBuilder.egg-info/SOURCES.txt +5 -0
- ConstructBuilder/ConstructBuilder.egg-info/dependency_links.txt +1 -0
- ConstructBuilder/ConstructBuilder.egg-info/top_level.txt +1 -0
- ConstructBuilder/__init__.py +0 -0
- ConstructBuilder/__pycache__/__init__.cpython-39.pyc +0 -0
- ConstructBuilder/__pycache__/builder.cpython-39.pyc +0 -0
- ConstructBuilder/builder.py +94 -0
- ConstructBuilder/setup.py +2 -0
- construct.py +2 -2
ConstructBuilder/ConstructBuilder.egg-info/PKG-INFO
ADDED
@@ -0,0 +1,10 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
Metadata-Version: 1.0
|
2 |
+
Name: ConstructBuilder
|
3 |
+
Version: 0.0.0
|
4 |
+
Summary: UNKNOWN
|
5 |
+
Home-page: UNKNOWN
|
6 |
+
Author: UNKNOWN
|
7 |
+
Author-email: UNKNOWN
|
8 |
+
License: UNKNOWN
|
9 |
+
Description: UNKNOWN
|
10 |
+
Platform: UNKNOWN
|
ConstructBuilder/ConstructBuilder.egg-info/SOURCES.txt
ADDED
@@ -0,0 +1,5 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
setup.py
|
2 |
+
ConstructBuilder.egg-info/PKG-INFO
|
3 |
+
ConstructBuilder.egg-info/SOURCES.txt
|
4 |
+
ConstructBuilder.egg-info/dependency_links.txt
|
5 |
+
ConstructBuilder.egg-info/top_level.txt
|
ConstructBuilder/ConstructBuilder.egg-info/dependency_links.txt
ADDED
@@ -0,0 +1 @@
|
|
|
|
|
1 |
+
|
ConstructBuilder/ConstructBuilder.egg-info/top_level.txt
ADDED
@@ -0,0 +1 @@
|
|
|
|
|
1 |
+
|
ConstructBuilder/__init__.py
ADDED
File without changes
|
ConstructBuilder/__pycache__/__init__.cpython-39.pyc
ADDED
Binary file (153 Bytes). View file
|
|
ConstructBuilder/__pycache__/builder.cpython-39.pyc
ADDED
Binary file (5.29 kB). View file
|
|
ConstructBuilder/builder.py
ADDED
@@ -0,0 +1,94 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
G = 'MVSKGEELFTGVVPILVELDGDVNGHKFSVSGEGEGDATYGKLTLKFICTTGKLPVPWPTLVTTLTYGVQCFSRYPDHMKQHDFFKSAMPEGYVQERTIFFKDDGNYKTRAEVKFEGDTLVNRIELKGIDFKEDGNILGHKLEYNYNSHNVYIMADKQKNGIKVNFKIRHNIEDGSVQLADHYQQNTPIGDGPVLLPDNHYLSTQSALSKDPNEKRDHMVLLEFVTAAGITLGMDELYK'
|
2 |
+
L2 = 'XXXXXXX'
|
3 |
+
T = 'LEENLYFQS'
|
4 |
+
L1 = 'GGSGGGSGGGSGGGS'
|
5 |
+
H = 'HHHHHH'
|
6 |
+
soluTag = {
|
7 |
+
'MBP': 'MKIKTGARILALSALTTMMFSASALAKIEEGKLVIWINGDKGYNGLAEVGKKFEKDTGIKVTVEHPDKLEEKFPQVAATGDGPDIIFWAHDRFGGYAQSGLLAEITPDKAFQDKLYPFTWDAVRYNGKLIAYPIAVEALSLIYNKDLLPNPPKTWEEIPALDKELKAKGKSALMFNLQEPYFTWPLIAADGGYAFKYENGKYDIKDVGVDNAGAKAGLTFLVDLIKNKHMNADTDYSIAEAAFNKGETAMTINGPWAWSNIDTSKVNYGVTVLPTFKGQPSKPFVGVLSAGINAASPNKELAKEFLENYLLTDEGLEAVNKDKPLGAVALKSYEEELAKDPRIAATMENAQKGEIMPNIPQMSAFWYAVRTAVINAASGRQTVDEALKDAQTRITK',
|
8 |
+
'SUMO': 'MSDQEAKPSTEDLGDKKEGEYIKLKVIGQDSSEIHFKVKMTTHLKKLKESYCQRQGVPMNSLRFLFEGQRIADNHTPKELGMEEEDVIEVYQEQTGGHSTV',
|
9 |
+
'Fh8': 'MPSVQEVEKLLHVLDRNGDGKVSAEELKAFADDSKCPLDSNKIKAFIKEHDKNKDGKLDLKELVSILSS',
|
10 |
+
'GST': 'MKLFYKPGACSLASHITLRESGKDFTLVSVDLMKKRLENGDDYFAVNPKGQVPALLLDDGTLLTEGVAIMQYLADSVPDRQLLAPVNSISRYKTIEWLNYIATELHKGFTPLFRPDTPEEYKPTVRAQLEKKLQYVNEALKDEHWICGQRFTIADAYLFTVLRWAYAVKLNLEGLEHIAAFMQRMAERPEVQDALSAEGLK',
|
11 |
+
'MBP': 'MKIKTGARILALSALTTMMFSASALAKIEEGKLVIWINGDKGYNGLAEVGKKFEKDTGIKVTVEHPDKLEEKFPQVAATGDGPDIIFWAHDRFGGYAQSGLLAEITPDKAFQDKLYPFTWDAVRYNGKLIAYPIAVEALSLIYNKDLLPNPPKTWEEIPALDKELKAKGKSALMFNLQEPYFTWPLIAADGGYAFKYENGKYDIKDVGVDNAGAKAGLTFLVDLIKNKHMNADTDYSIAEAAFNKGETAMTINGPWAWSNIDTSKVNYGVTVLPTFKGQPSKPFVGVLSAGINAASPNKELAKEFLENYLLTDEGLEAVNKDKPLGAVALKSYEEELAKDPRIAATMENAQKGEIMPNIPQMSAFWYAVRTAVINAASGRQTVDEALKDAQTRITK',
|
12 |
+
'NusA': 'MNKEILAVVEAVSNEKALPREKIFEALESALATATKKKYEQEIDVRVQIDRKSGDFDTFRRWLVVDEVTQPTKEITLEAARYEDESLNLGDYVEDQIESVTFDRITTQTAKQVIVQKVREAERAMVVDQFREHEGEIITGVVKKVNRDNISLDLGNNAEAVILREDMLPRENFRPGDRVRGVLYSVRPEARGAQLFVTRSKPEMLIELFRIEVPEIGEEVIEIKAAARDPGSRAKIAVKTNDKRIDPVGACVGMRGARVQAVSTELGGERIDIVLWDDNPAQFVINAMAPADVASIVVDEDKHTMDIAVEAGNLAQAIGRNGQNVRLASQLSGWELNVMTDDLQAKHQAEAHAAIDTFTKYLDIDEDFATVLVEEGFSTLEELAYVPMKELLEIEGLDEPTVEALRERAKNALATIAQAQEESLGDNKPADDLLNLEGVDRDLAFKLAARGVCTLEDLAEQGIDDLADIEGLTDEKAGALIMAARNICWFGDEA',
|
13 |
+
'Thioredoxin': 'SDKIIHLTDDSFDTDVLKADGAILVDFWAEWCGPCKMIAPILDEIADEYQGKLTVAKLNIDQNPGTAPKYGIRGIPTLLLFKNGEVAATKVGALSKGQLKEFLDANLA',
|
14 |
+
'FLAG': 'DYKDDDDK',
|
15 |
+
'S-tag': 'KETAAAKFERQHMDS',
|
16 |
+
'CBP': 'KRRWKKNFIAVSAANRFKKISSSGAL',
|
17 |
+
'SUMO': 'MSDQEAKPSTEDLGDKKEGEYIKLKVIGQDSSEIHFKVKMTTHLKKLKESYCQRQGVPMNSLRFLFEGQRIADNHTPKELGMEEEDVIEVYQEQTGGHSTV',
|
18 |
+
'STREPII': 'WSHPQFEK',
|
19 |
+
'BAP': 'GLNDIFEAQKIEWHE',
|
20 |
+
'NT11': 'VSEPHDYNYEK',
|
21 |
+
'Fh8': 'MPSVQEVEKLLHVLDRNGDGKVSAEELKAFADDSKCPLDSNKIKAFIKEHDKNKDGKLDLKELVSILSS',
|
22 |
+
'Tab2': 'VVSHFND',
|
23 |
+
'Z-basic': 'VDNKFNKEQQNAFYEILHLPNLNEEQRNAFIQSLKDDPSQSANLLAEAKKLNDAQPK',
|
24 |
+
'ProteinA': 'MKKKNIYSIRKLGVGIASVTLGTLLISGGVTPAANAAQHDEAQQNAFYQVLNMPNLNADQRNGFIQSLKDDPSQSANVLGEAQKLNDSQAPKADAQQNNFNKDQQSAFYEILNMPNLNEAQRNGFIQSLKDDPSQSTNVLGEAKKLNESQAPKADNNFNKEQQNAFYEILNMPNLNEEQRNGFIQSLKDDPSQSANLLSEAKKLNESQAPKADNKFNKEQQNAFYEILHLPNLNEEQRNGFIQSLKDDPSQSANLLAEAKKLNDAQAPKADNKFNKEQQNAFYEILHLPNLTEEQRNGFIQSLKDDPSVSKEILAEAKKLNDAQAPKEEDNNKPGKEDNNKPGKEDNNKPGKEDNNKPGKEDNNKPGKEDGNKPGKEDNKKPGKEDGNKPGKEDNKKPGKEDGNKPGKEDGNKPGKEDGNGVHVVKPGDTVNDIAKANGADKIAADNKLADKNMIKPGQELVVDKKQPANHADANKAQALPETGEENPFIGTTVFGGLSLALGAALLEL',
|
25 |
+
'IMPACT': 'TNPGVSAWQVNTAYTAGQLVTYNGKTYKCLQPHTSLAGWEPSNVPALWQLQ',
|
26 |
+
'mysB': 'MTMYATLEEAIDAAREEFLADNPGIDAEDANVQQFNAQKYVLQDGDIMWQVEFFADEGEEGECLPMLSGEAAQSVFDGDYDEIEIRQEWQEENTLHEWDEGEFQLEPPLDTEEGRAAADEWDER',
|
27 |
+
'PolyR': 'RRRRR',
|
28 |
+
'c-myc': 'EQKLISEEDL',
|
29 |
+
'S': 'KETAAAKFERQHMDS',
|
30 |
+
'SBP-tag': 'MDEKTTGWRGGHVVEGLAGELEQLRARLEHHPQGQREP',
|
31 |
+
'Strep-tag': 'WRHPQFGG',
|
32 |
+
'Twin-Strep-tag': 'SAWSHPQFEKGGGSGGGSGGSAWSHPQFEK',
|
33 |
+
'HAT': 'KDHLIHNVHKEFHAHAHNK',
|
34 |
+
'BCCP': 'MDIRKIKKLIELVEESGISELEISEGEESVRISRAAPAASFPVMQQAYAAPMMQQPAQSNAAAPATVPSMEAPAAAEISGHIVRSPMVGTFYRTPSPDAKAFIEVGQKVNVDTLCIVEAMKMMNQIEADKSGTVKAILVESGQPVEFDEPLVVIE',
|
35 |
+
'HaloTag': 'SGSAEIGTGFPFDPHYVEVLGERMHYVDVGPRDGTPVLFLHGNPTSSYVWRNIIPHVAPTHRCIAPDLIGMGKSDKPDLGYFFDDHVRFMDAFIEALGLEEVVLVIHDWGSALGFHWAKRNPERVKGIAFMEFIRPIPTWDEWPEFARETFQAFRTTDVGRKLIIDQNVFIEGTLPCGVVRPLTEVEMDHYREPFLNPVDREPLWRFPNELPIAGEPANIVALVEEYMDWLHQSPVPKLLFWGTPGVLIPPAEAARLAKSLPNCKAVDIGPGLNLLQEDNPDLIGSEIARWLSTLEISG'
|
36 |
+
}
|
37 |
+
|
38 |
+
def run_N(P:str, gfp:bool, solu_tag:list)->dict:
|
39 |
+
const = {}
|
40 |
+
if gfp:
|
41 |
+
for f in solu_tag:
|
42 |
+
F = soluTag[f]
|
43 |
+
const[f"con_gfp_N_{f}"] = P+T+L1+F+L2+G+H
|
44 |
+
if not solu_tag:
|
45 |
+
const[f"con_gfp_N"] = P+T+L2+G+H
|
46 |
+
else:
|
47 |
+
for f in solu_tag:
|
48 |
+
F = soluTag[f]
|
49 |
+
const[f"con_N_{f}"] = P+T+L1+F+H
|
50 |
+
if not solu_tag:
|
51 |
+
const[f"con_N"] = P+T+H # TODO: verify this one
|
52 |
+
return const
|
53 |
+
|
54 |
+
def run_C(P:str, gfp:bool, solu_tag:list)->dict:
|
55 |
+
const = {}
|
56 |
+
if gfp:
|
57 |
+
for f in solu_tag:
|
58 |
+
F = soluTag[f]
|
59 |
+
const[f"con_gfp_C_{f}"] = H+G+L2+F+L1+T+P
|
60 |
+
if not solu_tag:
|
61 |
+
const[f"con_gfp_C"] = H+G+L2+T+P
|
62 |
+
else:
|
63 |
+
for f in solu_tag:
|
64 |
+
F = soluTag[f]
|
65 |
+
const[f"con_C_{f}"] = H+F+L1+T+P
|
66 |
+
if not solu_tag:
|
67 |
+
const[f"con_C"] = H+T+P #TODO verify this
|
68 |
+
return const
|
69 |
+
|
70 |
+
def build(P:str, solu_tag:list, GFP:bool, P_pos:str)->dict:
|
71 |
+
"""
|
72 |
+
This function calculate constructs to Protera's LAB considering:
|
73 |
+
-orientation N to C terminal, or reverse
|
74 |
+
-With/withou GFP
|
75 |
+
-Fusion Proteins
|
76 |
+
|
77 |
+
usage = build( amino_sequence, solutags, GFP:True/false, P_pos:"N+C","N","C")
|
78 |
+
solutags availables:
|
79 |
+
'MBP', 'SUMO', 'Fh8', 'GST', 'NusA', 'Thioredoxin', 'FLAG', 'S-tag', 'CBP', 'STREPII', 'BAP', 'NT11', 'Tab2', 'Z-basic', 'ProteinA', 'IMPACT', 'mysB', 'PolyR', 'c-myc', 'S', 'SBP-tag', 'Strep-tag', 'Twin-Strep-tag', 'HAT', 'BCCP', 'HaloTag'
|
80 |
+
|
81 |
+
"""
|
82 |
+
if "all" in solu_tag:
|
83 |
+
solu_tag = list(soluTag.keys())
|
84 |
+
|
85 |
+
d1 = {}
|
86 |
+
d2 = {}
|
87 |
+
|
88 |
+
if "C" in P_pos:
|
89 |
+
d2 = run_C(P, GFP, solu_tag)
|
90 |
+
|
91 |
+
if "N" in P_pos:
|
92 |
+
d1 = run_N(P, GFP, solu_tag)
|
93 |
+
|
94 |
+
return {**d1,**d2}
|
ConstructBuilder/setup.py
ADDED
@@ -0,0 +1,2 @@
|
|
|
|
|
|
|
1 |
+
import setuptools
|
2 |
+
setuptools.setup(name="ConstructBuilder")
|
construct.py
CHANGED
@@ -19,8 +19,8 @@ def LabFusion(name, file , uni_seq , orientation:str="NC", gfp:bool=False, sol_t
|
|
19 |
dick[name] = build(uni_seq, sol_tag, gfp, orientation)
|
20 |
table = pd.DataFrame.from_dict(dick)
|
21 |
|
22 |
-
table.to_csv(f"
|
23 |
-
return table, f"
|
24 |
|
25 |
|
26 |
int_align = gr.Interface(fn=LabFusion,
|
|
|
19 |
dick[name] = build(uni_seq, sol_tag, gfp, orientation)
|
20 |
table = pd.DataFrame.from_dict(dick)
|
21 |
|
22 |
+
table.to_csv(f"./gradio_projects/constructs_{name}.csv")
|
23 |
+
return table, f"./gradio_projects/constructs_{name}.csv"
|
24 |
|
25 |
|
26 |
int_align = gr.Interface(fn=LabFusion,
|