forked from bmajoros/python
-
Notifications
You must be signed in to change notification settings - Fork 0
/
Copy pathNgramIterator.py
executable file
·90 lines (80 loc) · 3.28 KB
/
NgramIterator.py
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
#!/usr/bin/env python
#=========================================================================
# This is OPEN SOURCE SOFTWARE governed by the Gnu General Public
# License (GPL) version 3, as described at www.opensource.org.
# Copyright (C)2017 William H. Majoros ([email protected]).
#=========================================================================
from __future__ import (absolute_import, division, print_function,
unicode_literals, generators, nested_scopes, with_statement)
from builtins import (bytes, dict, int, list, object, range, str, ascii,
chr, hex, input, next, oct, open, pow, round, super, filter, map, zip)
# The above imports should allow this program to run in both Python 2 and
# Python 3. You might need to update your version of module "future".
######################################################################
#
# NgramIterator.py bmajoros
#
# Attributes:
# array ngram : array of integer indices into alphabet string
# string alphabet
# Methods:
# ngramIterator=NgramIterator("ATCG",N)
# string=ngramIterator.nextString() # returns None if no more
# ngramIterator.reset()
# Private methods:
# self.ngramToString()
######################################################################
class NgramIterator:
#---------------------------------------------------------------------
# PUBLIC METHODS
#---------------------------------------------------------------------
# ngramIterator=NgramIterator("ATCG",N)
def __init__(self,alphabet,N):
ngram=[]
alphaSize=len(alphabet)
for i in range(N-1): ngram.append(0)
if(N>0): ngram.append(-1)
self.alphabet=alphabet
self.ngram=ngram
#---------------------------------------------------------------------
# ngramIterator.reset()
def reset(self):
ngram=self.ngram
L=len(ngram)
for i in range(L-1): ngram[i]=0
ngram[L-1]=-1
#---------------------------------------------------------------------
# string=ngramIterator.nextString() # returns undef if no more
def nextString(self):
alphabet=self.alphabet
ngram=self.ngram
if(ngram is None): return None
L=len(ngram)
if(L==0):
self.ngram=None
return ""
alphaSize=len(alphabet)
for i in range(L-1,-1,-1): # for($i=$len-1 ; $i>=0 ; --$i)
ngram[i]+=1
index=ngram[i]
if(index<alphaSize): return self.ngramToString()
ngram[i]=0
return None
#---------------------------------------------------------------------
#---------------------------------------------------------------------
#---------------------------------------------------------------------
#---------------------------------------------------------------------
#---------------------------------------------------------------------
#---------------------------------------------------------------------
# PRIVATE METHODS
#---------------------------------------------------------------------
# self.ngramToString()
def ngramToString(self):
ngram=self.ngram
alphabet=self.alphabet
length=len(ngram)
string=""
for i in range(length):
index=ngram[i]
string+=alphabet[index:index+1]
return string