Some basic documentation

This commit is contained in:
Lukáš Plevač 2023-11-20 13:14:38 +01:00
parent 7dd7b3ed6e
commit 8a6e1220f9
6 changed files with 290 additions and 72 deletions

View File

@ -1,2 +1,3 @@
import ascii as ascii import ascii as ascii
import molecule as molecule import molecule as molecule
import register as register

View File

@ -1,6 +1,18 @@
##
# @file ascii.py
# @autor Lukáš Plevač <xpleva07@vutbr.cz>
# @brief defines function from print structions in ASCII reprezentation
from molecule import isComplementary from molecule import isComplementary
from molecule import nothing from molecule import nothing
##
# Return number of bases to bind with main chain 0
# @param chainID id of chain in molecule
# @param curPOS current position in molecule
# @param molecule molecule with chain
# @return int
#
def toBindingLen(chainID, curPOS, molecule): def toBindingLen(chainID, curPOS, molecule):
toBLen = 0 toBLen = 0
@ -28,6 +40,18 @@ def toBindingLen(chainID, curPOS, molecule):
return None return None
##
# Show molecule in ASCII reprezentation
# [AB].{D}<CD>
#
# /
# -/
# ----
# ABCD
#
# @param molecule molecule to print
# @param spacing chars between ascii chars
#
def showMolecule(molecule, spacing = ""): def showMolecule(molecule, spacing = ""):
Invlines = [ Invlines = [
"", # register strand "", # register strand

View File

@ -0,0 +1,9 @@
class Assembly:
def __init__(self, asm):
# remove whitespaces
asm = asm.strip()
# load macros from file
self.macros = self.parseMacros(asm)
def parseMacros(self, asm):

View File

@ -1,10 +1,15 @@
##
# @file molecule.py
# @autor Lukáš Plevač <xpleva07@vutbr.cz>
# @brief defines class molecule and functions to work with it
# #
# [aa] - double strand of aa (domain a and domain a) # [aa] - double strand of aa (domain a and domain a)
# {aa} - single strand of aa (domain a and domain a) [upper] # {aa} - single strand of aa (domain a and domain a) [upper]
# <aa> - single strand of aa (domain a and domain a) [downer] # <aa> - single strand of aa (domain a and domain a) [downer]
# #
# example: # example:
# <abc>[ABC]*{abc}<C>{ba}*[CC]*{CA} # <abc>[ABC].{abc}<C>{ba}.[CC].{CA}
# #
# c # c
# b b A # b b A
@ -14,21 +19,48 @@
# a b c A B C C C C # a b c A B C C C C
# #
##
# @brief Char representing space in chain
#
nothing = "-" nothing = "-"
##
# Check if two bases is complementary
# @param baseA one of base to check
# @param baseB second of base to check
# @return baseA is complementary to baseB
#
def isComplementary(baseA, baseB): def isComplementary(baseA, baseB):
return (f"{baseA}*" == baseB) or (baseA == f"{baseB}*") return (f"{baseA}*" == baseB) or (baseA == f"{baseB}*")
##
# Class representing moleculte
#
class Molecule: class Molecule:
##
# Init empty molecule
#
def __init__(self): def __init__(self):
self.chains = [] self.chains = []
##
# Get length of longest chain in molecule
# @return int
#
def __len__(self): def __len__(self):
return self.maxChainSize() return self.maxChainSize()
##
# Return number of count of chains in molecule
# @return int
#
def chainsCount(self): def chainsCount(self):
return len(self.chains) return len(self.chains)
##
# Pad all chains to same length using insert spaces
#
def endPad(self): def endPad(self):
targetSize = self.maxChainSize() targetSize = self.maxChainSize()
@ -36,15 +68,34 @@ class Molecule:
while (targetSize > len(self.chains[id])): while (targetSize > len(self.chains[id])):
self.chains[id].append(nothing) self.chains[id].append(nothing)
##
# Add base to end of chain
# @param base base to add
# @param chainId id of chain to add base
#
def addToChain(self, base, chainId): def addToChain(self, base, chainId):
self.chains[chainId].append(base) self.chains[chainId].append(base)
##
# Get chain as array
# @param chain id of chain
# @return array of chain
#
def getChain(self, chain): def getChain(self, chain):
return self.chains[chain] return self.chains[chain]
##
# Remove chain form molecule
# @param chainId id of chain
# @post all chains ids is reindex
#
def removeChain(self, chainId): def removeChain(self, chainId):
del self.chains[chainId] del self.chains[chainId]
##
# Get length of longest chain in molecule
# @return int
#
def maxChainSize(self): def maxChainSize(self):
maxLen = 0 maxLen = 0
for chain in self.chains: for chain in self.chains:
@ -52,38 +103,82 @@ class Molecule:
return maxLen return maxLen
##
# Add chain to end of chain in molecule
# @param chainID id of chain in molecule to add other chain on end
# @param chain array reprezentation of chain
#
def chain2chain(self, chainID, chain): def chain2chain(self, chainID, chain):
for base in chain: for base in chain:
self.chains[chainID].append(base) self.chains[chainID].append(base)
##
# Add spaces to start of chain in molecule
# @param chainID id of chain in molecule
# @param count count of spaces
#
def padChain(self, chainID, count): def padChain(self, chainID, count):
for _ in range(count): for _ in range(count):
self.chains[chainID].insert(0, nothing) self.chains[chainID].insert(0, nothing)
##
# Add spaces to start of chain in molecule by length of other chain in molecule
# @param chainID id of chain in molecule to pad
# @param targetID if of chain of len count of spaces
#
def padChainToLen(self, chainID, targetID): def padChainToLen(self, chainID, targetID):
targetSize = len(self.chains[targetID]) targetSize = len(self.chains[targetID])
curSize = len(self.chains[chainID]) curSize = len(self.chains[chainID])
self.padChain(chainID, targetSize - curSize) self.padChain(chainID, targetSize - curSize)
##
# Add spaces to start of all chains in molecule
# @param chainID id of chain in molecule to pad
# @param count count of spaces
#
def padAllChains(self, length): def padAllChains(self, length):
for id in range(len(self.chains)): for id in range(len(self.chains)):
self.padChain(id, length) self.padChain(id, length)
##
# Add base to end of chain same as addToChain()
# @param base base to add
# @param chainId id of chain to add base
#
def addBase(self, chainID, base): def addBase(self, chainID, base):
self.chains[chainID].append(base) self.chains[chainID].append(base)
##
# Add chain to molecule
# @return id of new chain
#
def addChain(self): def addChain(self):
chainId = len(self.chains) chainId = len(self.chains)
self.chains.append([]) self.chains.append([])
return chainId return chainId
##
# Update base in chain
# @param base base to set
# @param chainId id of chain to add base
# @param baseID id of base in chain
#
def updateBase(self, chainID, baseID, base): def updateBase(self, chainID, baseID, base):
self.chains[chainID][baseID] = base self.chains[chainID][baseID] = base
##
# Get base from chain
# @param chainId id of chain to add base
# @param baseID id of base in chain
#
def getBase(self, chainID, baseID): def getBase(self, chainID, baseID):
return self.chains[chainID][baseID] return self.chains[chainID][baseID]
##
# Get Number of possible binding on position on molecule
# @param baseID id of base in chain (position in molecule)
#
def bindedCountAt(self, baseID): def bindedCountAt(self, baseID):
binding = 0 binding = 0
for chain in self.chains: for chain in self.chains:
@ -92,6 +187,17 @@ class Molecule:
return binding return binding
##
# Add base to end of chain by char represetion
# A representing base A
# A* representing complement of base A
# A** representing base A (complement of complement)
# @param char char represetation of base to add
# @param chainId id of chain to add base
# @param isBackward is adding from back to front
# -A (+B)
# AB
#
def charAddBase(self, chainID, char, isBackward = False): def charAddBase(self, chainID, char, isBackward = False):
if isBackward: if isBackward:
if len(self.chains[chainID]) == 0 or self.getBase(chainID, 0) != nothing: if len(self.chains[chainID]) == 0 or self.getBase(chainID, 0) != nothing:
@ -108,6 +214,18 @@ class Molecule:
else: else:
self.addBase(chainID, char) self.addBase(chainID, char)
##
# Print raw reprezentation of molecule
# aligmented chains as string
# D
# B* C*
# A B C A B C
#
# Print as:
#
# A B C A B C
# - B* C* D* - -
#
def rawPrint(self): def rawPrint(self):
for chan in self.chains: for chan in self.chains:
raw = "" raw = ""
@ -116,6 +234,27 @@ class Molecule:
print(raw) print(raw)
##
# Convert string notation of molecule to molecule class object
# @param notationStr string notation of molecule
# @return Molecule object
#
# String notation:
# - <> for lower chain
# - [] for double chain
# - {} for upper chain
# - * for complement
# - . for concatenate upper strand with double strand
#
# String notation example:
# <abc>[ABC].{abc}<C>{ba}.[CC].{CA}
#
# c
# b b A
# a C
# A* B* C* C* C*
# | | | | |
# a b c A B C C C C
def parse(notationStr): def parse(notationStr):
newMolecule = Molecule() newMolecule = Molecule()
state = "init" state = "init"

View File

@ -1,20 +1,61 @@
##
# @file register.py
# @autor Lukáš Plevač <xpleva07@vutbr.cz>
# @brief implments REGISTER from SIMD|DNA
import molecule import molecule
import ascii import ascii
class Register: class Register:
##
# Init register
# @param mol molecule reprezenting register
#
def __init__(self, mol = molecule.Molecule()): def __init__(self, mol = molecule.Molecule()):
self.set(mol) self.set(mol)
##
# set register molecule
# @param mol molecule reprezenting register
#
def set(self, mol): def set(self, mol):
self.mol = mol self.mol = mol
def inscription(self, IMols): ##
# Perform instruction on register
# @param mol molecule reprezenting register
#
def instruction(self, IMols):
for mol in IMols: for mol in IMols:
# try bind mol to all possible bindings
self.doAllBinding(mol) self.doAllBinding(mol)
# remove unbinded chains from register (because new imol have bind on older chain with more bases that register)
# ---
# |||
# ---
#
# ---- R
self.removeUnbinded() self.removeUnbinded()
# remove unbinded chains from register (because new imol have bind on more posisin on register that older)
# --
#
# ---
# |||
# ---- R
self.removeReplaced() self.removeReplaced()
# remove all unstable binded chains binded on 1 base or lower
self.removeUnstable() self.removeUnstable()
##
# remove unbinded chains from register (because new imol have bind on more posisin on register that older)
# --
#
# ---
# |||
# ---- R
def removeReplaced(self): def removeReplaced(self):
while True: while True:
done = True done = True
@ -38,6 +79,13 @@ class Register:
if done: if done:
break break
##
# remove unbinded chains from register (because new imol have bind on older chain with more bases that register)
# ---
# |||
# ---
#
# ---- R
def removeUnbinded(self): def removeUnbinded(self):
while True: while True:
done = True done = True
@ -63,6 +111,8 @@ class Register:
if done: if done:
break break
##
# remove all unstable binded chains binded on 1 base or lower
def removeUnstable(self): def removeUnstable(self):
while True: while True:
done = True done = True
@ -71,11 +121,15 @@ class Register:
for chainI in range(self.mol.chainsCount() - 1, 0, -1): for chainI in range(self.mol.chainsCount() - 1, 0, -1):
# for all bases in molecule # for all bases in molecule
bindScore = 0 bindScore = 0
finalBindScore = 0
for pos in range(len(self.mol)): for pos in range(len(self.mol)):
if molecule.isComplementary(self.mol.getBase(chainI, pos), self.mol.getBase(0, pos)) and self.mol.bindedCountAt(pos) == 1: # binde minimaly once if molecule.isComplementary(self.mol.getBase(chainI, pos), self.mol.getBase(0, pos)) and self.mol.bindedCountAt(pos) == 1: # binde minimaly once
bindScore += 1 bindScore += 1
else:
bindScore = 0
finalBindScore = max(finalBindScore, bindScore)
if bindScore < 2: if finalBindScore < 2:
self.mol.removeChain(chainI) self.mol.removeChain(chainI)
done = False done = False
break break
@ -84,6 +138,10 @@ class Register:
if done: if done:
break break
##
# try bind mol to all possible bindings
# Added all imol bindings as new chains
# do not chech if other chain is ocupation this postion
def doAllBinding(self, imol): def doAllBinding(self, imol):
# for all chains in register # for all chains in register
for chainI in range(self.mol.chainsCount()): for chainI in range(self.mol.chainsCount()):
@ -108,73 +166,12 @@ class Register:
self.mol.chain2chain(chain, imol.getChain(0)) self.mol.chain2chain(chain, imol.getChain(0))
self.mol.endPad() self.mol.endPad()
##
# Show register with raw print molecule
def show(self): def show(self):
return self.mol.rawPrint() return self.mol.rawPrint()
##
# Show register with ascii reprezentation of molecule
def asciiShow(self, spaceing = ""): def asciiShow(self, spaceing = ""):
return ascii.showMolecule(self.mol, spaceing) return ascii.showMolecule(self.mol, spaceing)
print("---------------------------------")
print("Before")
print("---------------------------------\n")
# create register
num1 = "{A}[BCDE]"
num0 = "[ABC][DE]"
myreg = Register(molecule.parse(
num1 + num0 + num0 + num1 + num1 + num1 + num1 + num0 + num1 + num0
))
myreg.asciiShow()
print("\n---------------------------------")
print("After")
print("---------------------------------\n")
# do inscription
# mark
# myreg.inscription([
# molecule.parse("<A*B*C*D*E*>")
# ])
# do instruction
# remove
myreg.inscription([
molecule.parse("{D*E*A*F*}")
])
myreg.asciiShow(" ")
myreg.inscription([
molecule.parse("{D*E*A*B*C*G*}")
])
myreg.asciiShow(" ")
myreg.inscription([
molecule.parse("{DEABCG}")
])
myreg.asciiShow(" ")
myreg.inscription([
molecule.parse("{A*B*C*}"),
molecule.parse("{D*E*}")
])
myreg.asciiShow(" ")
myreg.inscription([
molecule.parse("{DEAF}")
])
myreg.asciiShow(" ")
myreg.inscription([
molecule.parse("{B*C*D*E*}")
])
myreg.asciiShow(" ")

48
src/main.py Normal file
View File

@ -0,0 +1,48 @@
from SIMDDNA.register import Register
from SIMDDNA import molecule
from SIMDDNA.assembly import Assembly
asm = Assembly(
"""
define:
0 [ABC][DE]
1 {A}[BCDE]
data:
1001111010
instructions:
{D*E*A*F*} # mark 01
{D*E*A*B*C*G*} # mark 11
{DEABCG} # remove mark 11
{A*B*C*} {D*E*} # write 0
{DEAF} # remove mark 01
{B*C*D*E*} # write 1
"""
)
print("=================================")
print("| Inital state |")
print("=================================")
print("\n")
regs = []
for data in asm.getData():
regs.append(Register(molecule.parse(data)))
regs[-1].asciiShow(spaceing = " ")
iId = 0
for ins in asm.getInstructions():
print("=================================")
print(f"| Instruction {iId} |")
print("=================================")
print("\n")
for reg in regs:
reg.instruction(ins)
reg.asciiShow(spaceing = " ")
iId += 1