-
Notifications
You must be signed in to change notification settings - Fork 2
/
Copy pathgenerate_test_sequence.py
48 lines (41 loc) · 1.46 KB
/
generate_test_sequence.py
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
import argparse, codecs, re
import numpy as np
def _sample_index(probabilities):
    """Draw one index from a categorical distribution.

    A single-trial multinomial draw yields a one-hot vector; ``argmax``
    returns the position of its only 1 as a plain scalar, which avoids
    converting a multi-dimensional array to ``int``.
    """
    return int(np.argmax(np.random.multinomial(1, probabilities)))


def main(args):
    """Sample random symbol sequences from a fixed HMM and save them.

    A 4-state, 6-symbol hidden Markov model is hard-coded below. Every
    sequence starts from state 0; each step first moves to a new state drawn
    from the current state's row of ``A`` and then emits one symbol drawn
    from the new state's row of ``B``. Each sequence is printed to stdout and
    written to ``text/test.txt`` as one line of space-separated symbol
    indices (the file is overwritten on every run).

    Args:
        args: Object with integer attributes ``num_seq`` (number of
            sequences to generate) and ``seq_length`` (symbols per sequence).
    """
    import os  # local import: only needed to create the output directory

    num_state = 4
    num_symbol = 6

    # State transition probabilities: row i is the distribution over the
    # next state given that the current state is i.
    A = np.zeros((num_state, num_state), dtype=np.float64)
    A[0] = 0.4, 0.1, 0.4, 0.1
    A[1] = 0.2, 0.3, 0.2, 0.3
    A[2] = 0.3, 0.2, 0.1, 0.4
    A[3] = 0.1, 0.4, 0.3, 0.2
    # Alternative transition parameters (disabled):
    # A[0] = 0.8, 0.2, 0.0, 0.0,
    # A[1] = 0.4, 0.6, 0.0, 0.0,
    # A[2] = 0.0, 0.0, 0.0, 0.0,
    # A[3] = 0.0, 0.0, 0.0, 0.0,

    # Emission probabilities: row i is the distribution over output symbols
    # when the model is in state i.
    B = np.zeros((num_state, num_symbol), dtype=np.float64)
    B[0] = 0.3, 0.7, 0.0, 0.0, 0.0, 0.0
    B[1] = 0.0, 0.0, 1.0, 0.0, 0.0, 0.0
    B[2] = 0.0, 0.0, 0.0, 1.0, 0.0, 0.0
    B[3] = 0.0, 0.0, 0.0, 0.0, 0.7, 0.3
    # Alternative emission parameters (disabled):
    # B[0] = 0.1, 0.9, 0.0, 0.0, 0.0, 0.0,
    # B[1] = 0.9, 0.1, 0.0, 0.0, 0.0, 0.0,
    # B[2] = 0.0, 0.0, 0.0, 0.0, 0.0, 0.0,
    # B[3] = 0.0, 0.0, 0.0, 0.0, 0.0, 0.0,

    # Create the output directory up front so a fresh checkout does not fail
    # with FileNotFoundError when the file is opened.
    os.makedirs("text", exist_ok=True)

    # newline="\n" disables platform newline translation, so each line ends
    # with a bare "\n" on every platform.
    with open("text/test.txt", "w", encoding="utf-8", newline="\n") as f:
        for _ in range(args.num_seq):
            state = 0
            emissions = []
            for _ in range(args.seq_length):
                # Transition first, then emit from the state just entered.
                state = _sample_index(A[state])
                emissions.append(str(_sample_index(B[state])))
            sequence = " ".join(emissions)
            print(sequence)
            f.write(sequence + "\n")
if __name__ == "__main__":
    # Command-line entry point: collect the generation options and pass the
    # parsed namespace to main().
    cli = argparse.ArgumentParser()
    # Help text: "length of one sentence".
    cli.add_argument(
        "-l",
        "--seq-length",
        type=int,
        default=20,
        help="1つの文の長さ.",
    )
    # Help text: "number of sentences to generate".
    cli.add_argument(
        "-n",
        "--num-seq",
        type=int,
        default=20,
        help="生成する文の個数.",
    )
    options = cli.parse_args()
    main(options)