forked from BimberLab/DiscvrLabKeyModules
-
Notifications
You must be signed in to change notification settings - Fork 1
Expand file tree
/
Copy pathSequenceAnalysis-0.00-11.20.sql
More file actions
1831 lines (1629 loc) · 306 KB
/
SequenceAnalysis-0.00-11.20.sql
File metadata and controls
1831 lines (1629 loc) · 306 KB
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
109
110
111
112
113
114
115
116
117
118
119
120
121
122
123
124
125
126
127
128
129
130
131
132
133
134
135
136
137
138
139
140
141
142
143
144
145
146
147
148
149
150
151
152
153
154
155
156
157
158
159
160
161
162
163
164
165
166
167
168
169
170
171
172
173
174
175
176
177
178
179
180
181
182
183
184
185
186
187
188
189
190
191
192
193
194
195
196
197
198
199
200
201
202
203
204
205
206
207
208
209
210
211
212
213
214
215
216
217
218
219
220
221
222
223
224
225
226
227
228
229
230
231
232
233
234
235
236
237
238
239
240
241
242
243
244
245
246
247
248
249
250
251
252
253
254
255
256
257
258
259
260
261
262
263
264
265
266
267
268
269
270
271
272
273
274
275
276
277
278
279
280
281
282
283
284
285
286
287
288
289
290
291
292
293
294
295
296
297
298
299
300
301
302
303
304
305
306
307
308
309
310
311
312
313
314
315
316
317
318
319
320
321
322
323
324
325
326
327
328
329
330
331
332
333
334
335
336
337
338
339
340
341
342
343
344
345
346
347
348
349
350
351
352
353
354
355
356
357
358
359
360
361
362
363
364
365
366
367
368
369
370
371
372
373
374
375
376
377
378
379
380
381
382
383
384
385
386
387
388
389
390
391
392
393
394
395
396
397
398
399
400
401
402
403
404
405
406
407
408
409
410
411
412
413
414
415
416
417
418
419
420
421
422
423
424
425
426
427
428
429
430
431
432
433
434
435
436
437
438
439
440
441
442
443
444
445
446
447
448
449
450
451
452
453
454
455
456
457
458
459
460
461
462
463
464
465
466
467
468
469
470
471
472
473
474
475
476
477
478
479
480
481
482
483
484
485
486
487
488
489
490
491
492
493
494
495
496
497
498
499
500
501
502
503
504
505
506
507
508
509
510
511
512
513
514
515
516
517
518
519
520
521
522
523
524
525
526
527
528
529
530
531
532
533
534
535
536
537
538
539
540
541
542
543
544
545
546
547
548
549
550
551
552
553
554
555
556
557
558
559
560
561
562
563
564
565
566
567
568
569
570
571
572
573
574
575
576
577
578
579
580
581
582
583
584
585
586
587
588
589
590
591
592
593
594
595
596
597
598
599
600
601
602
603
604
605
606
607
608
609
610
611
612
613
614
615
616
617
618
619
620
621
622
623
624
625
626
627
628
629
630
631
632
633
634
635
636
637
638
639
640
641
642
643
644
645
646
647
648
649
650
651
652
653
654
655
656
657
658
659
660
661
662
663
664
665
666
667
668
669
670
671
672
673
674
675
676
677
678
679
680
681
682
683
684
685
686
687
688
689
690
691
692
693
694
695
696
697
698
699
700
701
702
703
704
705
706
707
708
709
710
711
712
713
714
715
716
717
718
719
720
721
722
723
724
725
726
727
728
729
730
731
732
733
734
735
736
737
738
739
740
741
742
743
744
745
746
747
748
749
750
751
752
753
754
755
756
757
758
759
760
761
762
763
764
765
766
767
768
769
770
771
772
773
774
775
776
777
778
779
780
781
782
783
784
785
786
787
788
789
790
791
792
793
794
795
796
797
798
799
800
801
802
803
804
805
806
807
808
809
810
811
812
813
814
815
816
817
818
819
820
821
822
823
824
825
826
827
828
829
830
831
832
833
834
835
836
837
838
839
840
841
842
843
844
845
846
847
848
849
850
851
852
853
854
855
856
857
858
859
860
861
862
863
864
865
866
867
868
869
870
871
872
873
874
875
876
877
878
879
880
881
882
883
884
885
886
887
888
889
890
891
892
893
894
895
896
897
898
899
900
901
902
903
904
905
906
907
908
909
910
911
912
913
914
915
916
917
918
919
920
921
922
923
924
925
926
927
928
929
930
931
932
933
934
935
936
937
938
939
940
941
942
943
944
945
946
947
948
949
950
951
952
953
954
955
956
957
958
959
960
961
962
963
964
965
966
967
968
969
970
971
972
973
974
975
976
977
978
979
980
981
982
983
984
985
986
987
988
989
990
991
992
993
994
995
996
997
998
999
1000
/*
* Copyright (c) 2012 LabKey Corporation
*
* Licensed under the Apache License, Version 2.0 (the "License");
* you may not use this file except in compliance with the License.
* You may obtain a copy of the License at
*
* http://www.apache.org/licenses/LICENSE-2.0
*
* Unless required by applicable law or agreed to in writing, software
* distributed under the License is distributed on an "AS IS" BASIS,
* WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
* See the License for the specific language governing permissions and
* limitations under the License.
*/
/* SequenceAnalysis-0.00-0.10.sql */
CREATE SCHEMA SequenceAnalysis;
-- ----------------------------
-- Table structure for sequenceanalysis.module_properties
-- ----------------------------
CREATE TABLE sequenceanalysis.module_properties
(
RowId SERIAL NOT NULL,
prop_name varchar(255) DEFAULT NULL,
stringvalue varchar(255) DEFAULT NULL,
floatvalue float DEFAULT NULL,
Container ENTITYID NOT NULL,
CreatedBy USERID,
Created TIMESTAMP,
ModifiedBy USERID,
Modified TIMESTAMP,
CONSTRAINT PK_module_properties PRIMARY KEY (rowId)
)
WITH (OIDS=FALSE);
-- ----------------------------
-- Table structure for sequenceanalysis.site_module_properties
-- ----------------------------
CREATE TABLE sequenceanalysis.site_module_properties
(
prop_name varchar(255) DEFAULT NULL,
stringvalue varchar(255) DEFAULT NULL,
floatvalue float DEFAULT NULL,
Container ENTITYID NOT NULL,
CreatedBy USERID,
Created TIMESTAMP,
ModifiedBy USERID,
Modified TIMESTAMP,
CONSTRAINT PK_site_module_properties PRIMARY KEY (prop_name)
)
WITH (OIDS=FALSE);
-- ----------------------------
-- Table structure for sequenceanalysis.sequence_analyses
-- ----------------------------
CREATE TABLE sequenceanalysis.sequence_analyses
(
RowId SERIAL NOT NULL,
type varchar(255) DEFAULT NULL,
runId INTEGER DEFAULT NULL,
sampleId INTEGER DEFAULT NULL,
inputFile INTEGER DEFAULT NULL,
outputFile INTEGER DEFAULT NULL,
makePublic bool DEFAULT FALSE,
Container ENTITYID NOT NULL,
CreatedBy USERID,
Created TIMESTAMP,
ModifiedBy USERID,
Modified TIMESTAMP,
CONSTRAINT PK_sequence_analyses PRIMARY KEY (rowId)
)
WITH (OIDS=FALSE);
-- ----------------------------
-- Table structure for sequenceanalysis.external_dbs
-- ----------------------------
CREATE TABLE sequenceanalysis.external_dbs
(
RowId SERIAL NOT NULL,
Name VARCHAR(255) DEFAULT NULL,
Details VARCHAR(255) DEFAULT NULL,
Container ENTITYID NOT NULL,
CreatedBy USERID,
Created TIMESTAMP,
ModifiedBy USERID,
Modified TIMESTAMP,
CONSTRAINT PK_external_dbs PRIMARY KEY (rowId)
)
WITH (OIDS=FALSE);
-- ----------------------------
-- Table structure for sequenceanalysis.barcodes
-- ----------------------------
CREATE TABLE sequenceanalysis.barcodes
(
tag_name VARCHAR(255) NOT NULL,
sequence VARCHAR(255) NOT NULL,
group_name VARCHAR(255) DEFAULT NULL,
--Container ENTITYID NOT NULL,
CreatedBy USERID,
Created TIMESTAMP,
ModifiedBy USERID,
Modified TIMESTAMP,
CONSTRAINT PK_barcodes PRIMARY KEY (tag_name),
CONSTRAINT UNIQUE_barcodes UNIQUE (sequence)
)
WITH (OIDS=FALSE);
-- ----------------------------
-- Records of barcodes
-- ----------------------------
-- @SkipOnEmptySchemasBegin
INSERT INTO sequenceanalysis.barcodes (tag_name, sequence, group_name) VALUES ('MID01', 'ACGAGTGCGT', 'GSMIDs');
INSERT INTO sequenceanalysis.barcodes (tag_name, sequence, group_name) VALUES ('MID02', 'ACGCTCGACA', 'GSMIDs');
INSERT INTO sequenceanalysis.barcodes (tag_name, sequence, group_name) VALUES ('MID03', 'AGACGCACTC', 'GSMIDs');
INSERT INTO sequenceanalysis.barcodes (tag_name, sequence, group_name) VALUES ('MID04', 'AGCACTGTAG', 'GSMIDs');
INSERT INTO sequenceanalysis.barcodes (tag_name, sequence, group_name) VALUES ('MID05', 'ATCAGACACG', 'GSMIDs');
INSERT INTO sequenceanalysis.barcodes (tag_name, sequence, group_name) VALUES ('MID06', 'ATATCGCGAG', 'GSMIDs');
INSERT INTO sequenceanalysis.barcodes (tag_name, sequence, group_name) VALUES ('MID07', 'CGTGTCTCTA', 'GSMIDs');
INSERT INTO sequenceanalysis.barcodes (tag_name, sequence, group_name) VALUES ('MID08', 'CTCGCGTGTC', 'GSMIDs');
INSERT INTO sequenceanalysis.barcodes (tag_name, sequence, group_name) VALUES ('MID09', 'TAGTATCAGC', 'GSMIDs');
INSERT INTO sequenceanalysis.barcodes (tag_name, sequence, group_name) VALUES ('MID10', 'TCTCTATGCG', 'GSMIDs');
INSERT INTO sequenceanalysis.barcodes (tag_name, sequence, group_name) VALUES ('MID11', 'TGATACGTCT', 'GSMIDs');
INSERT INTO sequenceanalysis.barcodes (tag_name, sequence, group_name) VALUES ('MID12', 'TACTGAGCTA', 'GSMIDs');
INSERT INTO sequenceanalysis.barcodes (tag_name, sequence, group_name) VALUES ('MID13', 'CATAGTAGTG', 'GSMIDs');
INSERT INTO sequenceanalysis.barcodes (tag_name, sequence, group_name) VALUES ('MID14', 'CGAGAGATAC', 'GSMIDs');
INSERT INTO sequenceanalysis.barcodes (tag_name, sequence, group_name) VALUES ('MID15', 'ATACGACGTA', 'GSMIDs');
INSERT INTO sequenceanalysis.barcodes (tag_name, sequence, group_name) VALUES ('MID16', 'TCACGTACTA', 'GSMIDs');
INSERT INTO sequenceanalysis.barcodes (tag_name, sequence, group_name) VALUES ('MID17', 'CGTCTAGTAC', 'GSMIDs');
INSERT INTO sequenceanalysis.barcodes (tag_name, sequence, group_name) VALUES ('MID18', 'TCTACGTAGC', 'GSMIDs');
INSERT INTO sequenceanalysis.barcodes (tag_name, sequence, group_name) VALUES ('MID19', 'TGTACTACTC', 'GSMIDs');
INSERT INTO sequenceanalysis.barcodes (tag_name, sequence, group_name) VALUES ('MID20', 'ACGACTACAG', 'GSMIDs');
INSERT INTO sequenceanalysis.barcodes (tag_name, sequence, group_name) VALUES ('MID21', 'CGTAGACTAG', 'GSMIDs');
INSERT INTO sequenceanalysis.barcodes (tag_name, sequence, group_name) VALUES ('MID22', 'TACGAGTATG', 'GSMIDs');
INSERT INTO sequenceanalysis.barcodes (tag_name, sequence, group_name) VALUES ('MID23', 'TACTCTCGTG', 'GSMIDs');
INSERT INTO sequenceanalysis.barcodes (tag_name, sequence, group_name) VALUES ('MID24', 'TAGAGACGAG', 'GSMIDs');
INSERT INTO sequenceanalysis.barcodes (tag_name, sequence, group_name) VALUES ('MID25', 'TCGTCGCTCG', 'GSMIDs');
INSERT INTO sequenceanalysis.barcodes (tag_name, sequence, group_name) VALUES ('MID26', 'ACATACGCGT', 'GSMIDs');
INSERT INTO sequenceanalysis.barcodes (tag_name, sequence, group_name) VALUES ('MID27', 'ACGCGAGTAT', 'GSMIDs');
INSERT INTO sequenceanalysis.barcodes (tag_name, sequence, group_name) VALUES ('MID28', 'ACTACTATGT', 'GSMIDs');
INSERT INTO sequenceanalysis.barcodes (tag_name, sequence, group_name) VALUES ('MID29', 'ACTGTACAGT', 'GSMIDs');
INSERT INTO sequenceanalysis.barcodes (tag_name, sequence, group_name) VALUES ('MID30', 'AGACTATACT', 'GSMIDs');
INSERT INTO sequenceanalysis.barcodes (tag_name, sequence, group_name) VALUES ('MID31', 'AGCGTCGTCT', 'GSMIDs');
INSERT INTO sequenceanalysis.barcodes (tag_name, sequence, group_name) VALUES ('MID32', 'AGTACGCTAT', 'GSMIDs');
INSERT INTO sequenceanalysis.barcodes (tag_name, sequence, group_name) VALUES ('MID33', 'ATAGAGTACT', 'GSMIDs');
INSERT INTO sequenceanalysis.barcodes (tag_name, sequence, group_name) VALUES ('MID34', 'CACGCTACGT', 'GSMIDs');
INSERT INTO sequenceanalysis.barcodes (tag_name, sequence, group_name) VALUES ('MID35', 'CAGTAGACGT', 'GSMIDs');
INSERT INTO sequenceanalysis.barcodes (tag_name, sequence, group_name) VALUES ('MID36', 'CGACGTGACT', 'GSMIDs');
INSERT INTO sequenceanalysis.barcodes (tag_name, sequence, group_name) VALUES ('MID37', 'TACACACACT', 'GSMIDs');
INSERT INTO sequenceanalysis.barcodes (tag_name, sequence, group_name) VALUES ('MID38', 'TACACGTGAT', 'GSMIDs');
INSERT INTO sequenceanalysis.barcodes (tag_name, sequence, group_name) VALUES ('MID39', 'TACAGATCGT', 'GSMIDs');
INSERT INTO sequenceanalysis.barcodes (tag_name, sequence, group_name) VALUES ('MID40', 'TACGCTGTCT', 'GSMIDs');
INSERT INTO sequenceanalysis.barcodes (tag_name, sequence, group_name) VALUES ('MID41', 'TAGTGTAGAT', 'GSMIDs');
INSERT INTO sequenceanalysis.barcodes (tag_name, sequence, group_name) VALUES ('MID42', 'TCGATCACGT', 'GSMIDs');
INSERT INTO sequenceanalysis.barcodes (tag_name, sequence, group_name) VALUES ('MID43', 'TCGCACTAGT', 'GSMIDs');
INSERT INTO sequenceanalysis.barcodes (tag_name, sequence, group_name) VALUES ('MID44', 'TCTAGCGACT', 'GSMIDs');
INSERT INTO sequenceanalysis.barcodes (tag_name, sequence, group_name) VALUES ('MID45', 'TCTATACTAT', 'GSMIDs');
INSERT INTO sequenceanalysis.barcodes (tag_name, sequence, group_name) VALUES ('MID46', 'TGACGTATGT', 'GSMIDs');
INSERT INTO sequenceanalysis.barcodes (tag_name, sequence, group_name) VALUES ('MID47', 'TGTGAGTAGT', 'GSMIDs');
INSERT INTO sequenceanalysis.barcodes (tag_name, sequence, group_name) VALUES ('MID48', 'ACAGTATATA', 'GSMIDs');
INSERT INTO sequenceanalysis.barcodes (tag_name, sequence, group_name) VALUES ('MID49', 'ACGCGATCGA', 'GSMIDs');
INSERT INTO sequenceanalysis.barcodes (tag_name, sequence, group_name) VALUES ('MID50', 'ACTAGCAGTA', 'GSMIDs');
INSERT INTO sequenceanalysis.barcodes (tag_name, sequence, group_name) VALUES ('MID51', 'AGCTCACGTA', 'GSMIDs');
INSERT INTO sequenceanalysis.barcodes (tag_name, sequence, group_name) VALUES ('MID52', 'AGTATACATA', 'GSMIDs');
INSERT INTO sequenceanalysis.barcodes (tag_name, sequence, group_name) VALUES ('MID53', 'AGTCGAGAGA', 'GSMIDs');
INSERT INTO sequenceanalysis.barcodes (tag_name, sequence, group_name) VALUES ('MID54', 'AGTGCTACGA', 'GSMIDs');
INSERT INTO sequenceanalysis.barcodes (tag_name, sequence, group_name) VALUES ('MID55', 'CGATCGTATA', 'GSMIDs');
INSERT INTO sequenceanalysis.barcodes (tag_name, sequence, group_name) VALUES ('MID56', 'CGCAGTACGA', 'GSMIDs');
INSERT INTO sequenceanalysis.barcodes (tag_name, sequence, group_name) VALUES ('MID57', 'CGCGTATACA', 'GSMIDs');
INSERT INTO sequenceanalysis.barcodes (tag_name, sequence, group_name) VALUES ('MID58', 'CGTACAGTCA', 'GSMIDs');
INSERT INTO sequenceanalysis.barcodes (tag_name, sequence, group_name) VALUES ('MID59', 'CGTACTCAGA', 'GSMIDs');
INSERT INTO sequenceanalysis.barcodes (tag_name, sequence, group_name) VALUES ('MID60', 'CTACGCTCTA', 'GSMIDs');
INSERT INTO sequenceanalysis.barcodes (tag_name, sequence, group_name) VALUES ('MID61', 'CTATAGCGTA', 'GSMIDs');
INSERT INTO sequenceanalysis.barcodes (tag_name, sequence, group_name) VALUES ('MID62', 'TACGTCATCA', 'GSMIDs');
INSERT INTO sequenceanalysis.barcodes (tag_name, sequence, group_name) VALUES ('MID63', 'TAGTCGCATA', 'GSMIDs');
INSERT INTO sequenceanalysis.barcodes (tag_name, sequence, group_name) VALUES ('MID64', 'TATATATACA', 'GSMIDs');
INSERT INTO sequenceanalysis.barcodes (tag_name, sequence, group_name) VALUES ('MID65', 'TATGCTAGTA', 'GSMIDs');
INSERT INTO sequenceanalysis.barcodes (tag_name, sequence, group_name) VALUES ('MID66', 'TCACGCGAGA', 'GSMIDs');
INSERT INTO sequenceanalysis.barcodes (tag_name, sequence, group_name) VALUES ('MID67', 'TCGATAGTGA', 'GSMIDs');
INSERT INTO sequenceanalysis.barcodes (tag_name, sequence, group_name) VALUES ('MID68', 'TCGCTGCGTA', 'GSMIDs');
INSERT INTO sequenceanalysis.barcodes (tag_name, sequence, group_name) VALUES ('MID69', 'TCTGACGTCA', 'GSMIDs');
INSERT INTO sequenceanalysis.barcodes (tag_name, sequence, group_name) VALUES ('MID70', 'TGAGTCAGTA', 'GSMIDs');
INSERT INTO sequenceanalysis.barcodes (tag_name, sequence, group_name) VALUES ('MID71', 'TGTAGTGTGA', 'GSMIDs');
INSERT INTO sequenceanalysis.barcodes (tag_name, sequence, group_name) VALUES ('MID72', 'TGTCACACGA', 'GSMIDs');
INSERT INTO sequenceanalysis.barcodes (tag_name, sequence, group_name) VALUES ('MID73', 'TGTCGTCGCA', 'GSMIDs');
INSERT INTO sequenceanalysis.barcodes (tag_name, sequence, group_name) VALUES ('MID74', 'ACACATACGC', 'GSMIDs');
INSERT INTO sequenceanalysis.barcodes (tag_name, sequence, group_name) VALUES ('MID75', 'ACAGTCGTGC', 'GSMIDs');
INSERT INTO sequenceanalysis.barcodes (tag_name, sequence, group_name) VALUES ('MID76', 'ACATGACGAC', 'GSMIDs');
INSERT INTO sequenceanalysis.barcodes (tag_name, sequence, group_name) VALUES ('MID77', 'ACGACAGCTC', 'GSMIDs');
INSERT INTO sequenceanalysis.barcodes (tag_name, sequence, group_name) VALUES ('MID78', 'ACGTCTCATC', 'GSMIDs');
INSERT INTO sequenceanalysis.barcodes (tag_name, sequence, group_name) VALUES ('MID79', 'ACTCATCTAC', 'GSMIDs');
INSERT INTO sequenceanalysis.barcodes (tag_name, sequence, group_name) VALUES ('MID80', 'ACTCGCGCAC', 'GSMIDs');
INSERT INTO sequenceanalysis.barcodes (tag_name, sequence, group_name) VALUES ('MID81', 'AGAGCGTCAC', 'GSMIDs');
INSERT INTO sequenceanalysis.barcodes (tag_name, sequence, group_name) VALUES ('MID82', 'AGCGACTAGC', 'GSMIDs');
INSERT INTO sequenceanalysis.barcodes (tag_name, sequence, group_name) VALUES ('MID83', 'AGTAGTGATC', 'GSMIDs');
INSERT INTO sequenceanalysis.barcodes (tag_name, sequence, group_name) VALUES ('MID84', 'AGTGACACAC', 'GSMIDs');
INSERT INTO sequenceanalysis.barcodes (tag_name, sequence, group_name) VALUES ('MID85', 'AGTGTATGTC', 'GSMIDs');
INSERT INTO sequenceanalysis.barcodes (tag_name, sequence, group_name) VALUES ('MID86', 'ATAGATAGAC', 'GSMIDs');
INSERT INTO sequenceanalysis.barcodes (tag_name, sequence, group_name) VALUES ('MID87', 'ATATAGTCGC', 'GSMIDs');
INSERT INTO sequenceanalysis.barcodes (tag_name, sequence, group_name) VALUES ('MID88', 'ATCTACTGAC', 'GSMIDs');
INSERT INTO sequenceanalysis.barcodes (tag_name, sequence, group_name) VALUES ('MID89', 'CACGTAGATC', 'GSMIDs');
INSERT INTO sequenceanalysis.barcodes (tag_name, sequence, group_name) VALUES ('MID90', 'CACGTGTCGC', 'GSMIDs');
INSERT INTO sequenceanalysis.barcodes (tag_name, sequence, group_name) VALUES ('MID91', 'CATACTCTAC', 'GSMIDs');
INSERT INTO sequenceanalysis.barcodes (tag_name, sequence, group_name) VALUES ('MID92', 'CGACACTATC', 'GSMIDs');
INSERT INTO sequenceanalysis.barcodes (tag_name, sequence, group_name) VALUES ('MID93', 'CGAGACGCGC', 'GSMIDs');
INSERT INTO sequenceanalysis.barcodes (tag_name, sequence, group_name) VALUES ('MID94', 'CGTATGCGAC', 'GSMIDs');
INSERT INTO sequenceanalysis.barcodes (tag_name, sequence, group_name) VALUES ('MID95', 'CGTCGATCTC', 'GSMIDs');
INSERT INTO sequenceanalysis.barcodes (tag_name, sequence, group_name) VALUES ('MID96', 'CTACGACTGC', 'GSMIDs');
INSERT INTO sequenceanalysis.barcodes (tag_name, sequence, group_name) VALUES ('MID97', 'CTAGTCACTC', 'GSMIDs');
INSERT INTO sequenceanalysis.barcodes (tag_name, sequence, group_name) VALUES ('MID98', 'CTCTACGCTC', 'GSMIDs');
INSERT INTO sequenceanalysis.barcodes (tag_name, sequence, group_name) VALUES ('MID99', 'CTGTACATAC', 'GSMIDs');
INSERT INTO sequenceanalysis.barcodes (tag_name, sequence, group_name) VALUES ('MID100', 'TAGACTGCAC', 'GSMIDs');
INSERT INTO sequenceanalysis.barcodes (tag_name, sequence, group_name) VALUES ('MID101', 'TAGCGCGCGC', 'GSMIDs');
INSERT INTO sequenceanalysis.barcodes (tag_name, sequence, group_name) VALUES ('MID102', 'TAGCTCTATC', 'GSMIDs');
INSERT INTO sequenceanalysis.barcodes (tag_name, sequence, group_name) VALUES ('MID103', 'TATAGACATC', 'GSMIDs');
INSERT INTO sequenceanalysis.barcodes (tag_name, sequence, group_name) VALUES ('MID104', 'TATGATACGC', 'GSMIDs');
INSERT INTO sequenceanalysis.barcodes (tag_name, sequence, group_name) VALUES ('MID105', 'TCACTCATAC', 'GSMIDs');
INSERT INTO sequenceanalysis.barcodes (tag_name, sequence, group_name) VALUES ('MID106', 'TCATCGAGTC', 'GSMIDs');
INSERT INTO sequenceanalysis.barcodes (tag_name, sequence, group_name) VALUES ('MID107', 'TCGAGCTCTC', 'GSMIDs');
INSERT INTO sequenceanalysis.barcodes (tag_name, sequence, group_name) VALUES ('MID108', 'TCGCAGACAC', 'GSMIDs');
INSERT INTO sequenceanalysis.barcodes (tag_name, sequence, group_name) VALUES ('MID109', 'TCTGTCTCGC', 'GSMIDs');
INSERT INTO sequenceanalysis.barcodes (tag_name, sequence, group_name) VALUES ('MID110', 'TGAGTGACGC', 'GSMIDs');
INSERT INTO sequenceanalysis.barcodes (tag_name, sequence, group_name) VALUES ('MID111', 'TGATGTGTAC', 'GSMIDs');
INSERT INTO sequenceanalysis.barcodes (tag_name, sequence, group_name) VALUES ('MID112', 'TGCTATAGAC', 'GSMIDs');
INSERT INTO sequenceanalysis.barcodes (tag_name, sequence, group_name) VALUES ('MID113', 'TGCTCGCTAC', 'GSMIDs');
INSERT INTO sequenceanalysis.barcodes (tag_name, sequence, group_name) VALUES ('MID114', 'ACGTGCAGCG', 'GSMIDs');
INSERT INTO sequenceanalysis.barcodes (tag_name, sequence, group_name) VALUES ('MID115', 'ACTCACAGAG', 'GSMIDs');
INSERT INTO sequenceanalysis.barcodes (tag_name, sequence, group_name) VALUES ('MID116', 'AGACTCAGCG', 'GSMIDs');
INSERT INTO sequenceanalysis.barcodes (tag_name, sequence, group_name) VALUES ('MID117', 'AGAGAGTGTG', 'GSMIDs');
INSERT INTO sequenceanalysis.barcodes (tag_name, sequence, group_name) VALUES ('MID118', 'AGCTATCGCG', 'GSMIDs');
INSERT INTO sequenceanalysis.barcodes (tag_name, sequence, group_name) VALUES ('MID119', 'AGTCTGACTG', 'GSMIDs');
INSERT INTO sequenceanalysis.barcodes (tag_name, sequence, group_name) VALUES ('MID120', 'AGTGAGCTCG', 'GSMIDs');
INSERT INTO sequenceanalysis.barcodes (tag_name, sequence, group_name) VALUES ('MID121', 'ATAGCTCTCG', 'GSMIDs');
INSERT INTO sequenceanalysis.barcodes (tag_name, sequence, group_name) VALUES ('MID122', 'ATCACGTGCG', 'GSMIDs');
INSERT INTO sequenceanalysis.barcodes (tag_name, sequence, group_name) VALUES ('MID123', 'ATCGTAGCAG', 'GSMIDs');
INSERT INTO sequenceanalysis.barcodes (tag_name, sequence, group_name) VALUES ('MID124', 'ATCGTCTGTG', 'GSMIDs');
INSERT INTO sequenceanalysis.barcodes (tag_name, sequence, group_name) VALUES ('MID125', 'ATGTACGATG', 'GSMIDs');
INSERT INTO sequenceanalysis.barcodes (tag_name, sequence, group_name) VALUES ('MID126', 'ATGTGTCTAG', 'GSMIDs');
INSERT INTO sequenceanalysis.barcodes (tag_name, sequence, group_name) VALUES ('MID127', 'CACACGATAG', 'GSMIDs');
INSERT INTO sequenceanalysis.barcodes (tag_name, sequence, group_name) VALUES ('MID128', 'CACTCGCACG', 'GSMIDs');
INSERT INTO sequenceanalysis.barcodes (tag_name, sequence, group_name) VALUES ('MID129', 'CAGACGTCTG', 'GSMIDs');
INSERT INTO sequenceanalysis.barcodes (tag_name, sequence, group_name) VALUES ('MID130', 'CAGTACTGCG', 'GSMIDs');
INSERT INTO sequenceanalysis.barcodes (tag_name, sequence, group_name) VALUES ('MID131', 'CGACAGCGAG', 'GSMIDs');
INSERT INTO sequenceanalysis.barcodes (tag_name, sequence, group_name) VALUES ('MID132', 'CGATCTGTCG', 'GSMIDs');
INSERT INTO sequenceanalysis.barcodes (tag_name, sequence, group_name) VALUES ('MID133', 'CGCGTGCTAG', 'GSMIDs');
INSERT INTO sequenceanalysis.barcodes (tag_name, sequence, group_name) VALUES ('MID134', 'CGCTCGAGTG', 'GSMIDs');
INSERT INTO sequenceanalysis.barcodes (tag_name, sequence, group_name) VALUES ('MID135', 'CGTGATGACG', 'GSMIDs');
INSERT INTO sequenceanalysis.barcodes (tag_name, sequence, group_name) VALUES ('MID136', 'CTATGTACAG', 'GSMIDs');
INSERT INTO sequenceanalysis.barcodes (tag_name, sequence, group_name) VALUES ('MID137', 'CTCGATATAG', 'GSMIDs');
INSERT INTO sequenceanalysis.barcodes (tag_name, sequence, group_name) VALUES ('MID138', 'CTCGCACGCG', 'GSMIDs');
INSERT INTO sequenceanalysis.barcodes (tag_name, sequence, group_name) VALUES ('MID139', 'CTGCGTCACG', 'GSMIDs');
INSERT INTO sequenceanalysis.barcodes (tag_name, sequence, group_name) VALUES ('MID140', 'CTGTGCGTCG', 'GSMIDs');
INSERT INTO sequenceanalysis.barcodes (tag_name, sequence, group_name) VALUES ('MID141', 'TAGCATACTG', 'GSMIDs');
INSERT INTO sequenceanalysis.barcodes (tag_name, sequence, group_name) VALUES ('MID142', 'TATACATGTG', 'GSMIDs');
INSERT INTO sequenceanalysis.barcodes (tag_name, sequence, group_name) VALUES ('MID143', 'TATCACTCAG', 'GSMIDs');
INSERT INTO sequenceanalysis.barcodes (tag_name, sequence, group_name) VALUES ('MID144', 'TATCTGATAG', 'GSMIDs');
INSERT INTO sequenceanalysis.barcodes (tag_name, sequence, group_name) VALUES ('MID145', 'TCGTGACATG', 'GSMIDs');
INSERT INTO sequenceanalysis.barcodes (tag_name, sequence, group_name) VALUES ('MID146', 'TCTGATCGAG', 'GSMIDs');
INSERT INTO sequenceanalysis.barcodes (tag_name, sequence, group_name) VALUES ('MID147', 'TGACATCTCG', 'GSMIDs');
INSERT INTO sequenceanalysis.barcodes (tag_name, sequence, group_name) VALUES ('MID148', 'TGAGCTAGAG', 'GSMIDs');
INSERT INTO sequenceanalysis.barcodes (tag_name, sequence, group_name) VALUES ('MID149', 'TGATAGAGCG', 'GSMIDs');
INSERT INTO sequenceanalysis.barcodes (tag_name, sequence, group_name) VALUES ('MID150', 'TGCGTGTGCG', 'GSMIDs');
INSERT INTO sequenceanalysis.barcodes (tag_name, sequence, group_name) VALUES ('MID151', 'TGCTAGTCAG', 'GSMIDs');
INSERT INTO sequenceanalysis.barcodes (tag_name, sequence, group_name) VALUES ('MID152', 'TGTATCACAG', 'GSMIDs');
INSERT INTO sequenceanalysis.barcodes (tag_name, sequence, group_name) VALUES ('MID153', 'TGTGCGCGTG', 'GSMIDs');
-- @SkipOnEmptySchemasEnd
-- ----------------------------
-- Table structure for sequenceAnalysis.ref_nt_sequences
-- ----------------------------
CREATE TABLE sequenceAnalysis.ref_nt_sequences
(
RowId serial NOT NULL,
name VARCHAR(220),
sequence text NOT NULL,
category1 VARCHAR(100), --aka Virus or DNA
category2 VARCHAR(100), --aka Strain or DNA_Region
category3 VARCHAR(100), --aka Locus
category4 VARCHAR(100), --aka Lineage
mol_type VARCHAR(100),
genbank VARCHAR(100),
ipd_accession VARCHAR(100),
species VARCHAR(100),
geographic_origin VARCHAR(200),
status BOOLEAN DEFAULT TRUE,
comments text DEFAULT NULL,
CreatedBy USERID,
Created TIMESTAMP,
ModifiedBy USERID,
Modified TIMESTAMP,
CONSTRAINT PK_ref_nt_sequences PRIMARY KEY (rowid)
);
-- ----------------------------
-- Data for sequenceAnalysis.ref_nt_sequences
-- ----------------------------
INSERT INTO sequenceanalysis.ref_nt_sequences
(name,category1,category2,mol_type,species,sequence)
VALUES
('SIVmac239', 'Virus', 'SIVmac239', 'RNA', 'SIV', 'GCATGCACATTTTAAAGGCTTTTGCTAAATATAGCCAAAAGTCCTTCTACAAATTTTCTAAGAGTTCTGATTCAAAGCAGTAACAGGCCTTGTCTCATCATGAACTTTGGCATTTCATCTACAGCTAAGTTTATATCATAAATAGTTCTTTACAGGCAGCACCAACTTATACCCTTATAGCATACTTTACTGTGTGAAAATTGCATCTTTCATTAAGCTTACTGTAAATTTACTGGCTGTCTTCCTTGCAGGTTTCTGGAAGGGATTTATTACAGTGCAAGAAGACATAGAATCTTAGACATATACTTAGAAAAGGAAGAAGGCATCATACCAGATTGGCAGGATTACACCTCAGGACCAGGAATTAGATACCCAAAGACATTTGGCTGGCTATGGAAATTAGTCCCTGTAAATGTATCAGATGAGGCACAGGAGGATGAGGAGCATTATTTAATGCATCCAGCTCAAACTTCCCAGTGGGATGACCCTTGGGGAGAGGTTCTAGCATGGAAGTTTGATCCAACTCTGGCCTACACTTATGAGGCATATGTTAGATACCCAGAAGAGTTTGGAAGCAAGTCAGGCCTGTCAGAGGAAGAGGTTAGAAGAAGGCTAACCGCAAGAGGCCTTCTTAACATGGCTGACAAGAAGGAAACTCGCTGAAACAGCAGGGACTTTCCACAAGGGGATGTTACGGGGAGGTACTGGGGAGGAGCCGGTCGGGAACGCCCACTTTCTTGATGTATAAATATCACTGCATTTCGCTCTGTATTCAGTCGCTCTGCGGAGAGGCTGGCAGATTGAGCCCTGGGAGGTTCTCTCCAGCACTAGCAGGTAGAGCCTGGGTGTTCCCTGCTAGACTCTCACCAGCACTTGGCCGGTGCTGGGCAGAGTGACTCCACGCTTGCTTGCTTAAAGCCCTCTTCAATAAAGCTGCCATTTTAGAAGTAAGCTAGTGTGTGTTCCCATCTCTCCTAGCCGCCGCCTGGTCAACTCGGTACTCAATAATAAGAAGACCCTGGTCTGTTAGGACCCTTTCTGCTTTGGGAAACCGAAGCAGGAAAATCCCTAGCAGATTGGCGCCTGAACAGGGACTTGAAGGAGAGTGAGAGACTCCTGAGTACGGCTGAGTGAAGGCAGTAAGGGCGGCAGGAACCAACCACGACGGAGTGCTCCTATAAAGGCGCGGGTCGGTACCAGACGGCGTGAGGAGCGGGAGAGGAAGAGGCCTCCGGTTGCAGGTAAGTGCAACACAAAAAAGAAATAGCTGTCTTTTATCCAGGAAGGGGTAATAAGATAGAGTGGGAGATGGGCGTGAGAAACTCCGTCTTGTCAGGGAAGAAAGCAGATGAATTAGAAAAAATTAGGCTACGACCCAACGGAAAGAAAAAGTACATGTTGAAGCATGTAGTATGGGCAGCAAATGAATTAGATAGATTTGGATTAGCAGAAAGCCTGTTGGAGAACAAAGAAGGATGTCAAAAAATACTTTCGGTCTTAGCTCCATTAGTGCCAACAGGCTCAGAAAATTTAAAAAGCCTTTATAATACTGTCTGCGTCATCTGGTGCATTCACGCAGAAGAGAAAGTGAAACACACTGAGGAAGCAAAACAGATAGTGCAGAGACACCTAGTGGTGGAAACAGGAACAACAGAAACTATGCCAAAAACAAGTAGACCAACAGCACCATCTAGCGGCAGAGGAGGAAATTACCCAGTACAACAAATAGGTGGTAACTATGTCCACCTGCCATTAAGCCCGAGAACATTAAATGCCTGGGTAAAATTGATAGAGGAAAAGAAATTTGGAGCAGAAGTAGTGCCAGGATTTCAGGCACTGTCAGAAGGTTGCACCCCCTATGACATTAATCAGATGTTAAATTGTGTGGGAGACCATCAAGCGGCTATGCAGATTATCAGAGATATTATAAACGAGGAGGCTGCAGATTGGGACTTGCAGCACCCACAACCAGCTCCACAACAAGGACAACTTAGGGAGCCGTCAGGATCAGATATTGCAGGAACAACTAGTTCAGTAGATGAACAAATCCAGTGGATGTACAGACAACAGAACCCCATACCAGTAGGCAACATTTACAGGAGATGGATCCAACTGGGGTTGCAAAAATGTGTCAGAATGTATAACCCAACAAACATTCTAGATGTAAAACAAGGGCCAAAAGAGCCATTTCAGAGCTATGTAGACAGGTTCTACAAAAGTTTAAGAGCAGAACAGACAGATGCAGCAGTAAAGAATTGGATGACTCAAACACTGCTGATTCAAAATGCTAACCCAGATTGCAAGCTAGTGCTGAAGGGGCTGGGTGTGAATCCCACCCTAGAAGAAATGCTGACGGCTTGTCAAGGAGTAGGGGGGCCGGGACAGAAGGCTAGATTAATGGCAGAAGCCCTGAAAGAGGCCCTCGCACCAGTGCCAATCCCTTTTGCAGCAGCCCAACAGAGGGGACCAAGAAAGCCAATTAAGTGTTGGAATTGTGGGAAAGAGGGACACTCTGCAAGGCAATGCAGAGCCCCAAGAAGACAGGGATGCTGGAAATGTGGAAAAATGGACCATGTTATGGCCAAATGCCCAGACAGACAGGCGGGTTTTTTAGGCCTTGGTCCATGGGGAAAGAAGCCCCGCAATTTCCCCATGGCTCAAGTGCATCAGGGGCTGATGCCAACTGCTCCCCCAGAGGACCCAGCTGTGGATCTGCTAAAGAACTACATGCAGTTGGGCAAGCAGCAGAGAGAAAAGCAGAGAGAAAGCAGAGAGAAGCCTTACAAGGAGGTGACAGAGGATTTGCTGCACCTCAATTCTCTCTTTGGAGGAGACCAGTAGTCACTGCTCATATTGAAGGACAGCCTGTAGAAGTATTACTGGATACAGGGGCTGATGATTCTATTGTAACAGGAATAGAGTTAGGTCCACATTATACCCCAAAAATAGTAGGAGGAATAGGAGGTTTTATTAATACTAAAGAATACAAAAATGTAGAAATAGAAGTTTTAGGCAAAAGGATTAAAGGGACAATCATGACAGGGGACACCCCGATTAACATTTTTGGTAGAAATTTGCTAACAGCTCTGGGGATGTCTCTAAATTTTCCCATAGCTAAAGTAGAGCCTGTAAAAGTCGCCTTAAAGCCAGGAAAGGATGGACCAAAATTGAAGCAGTGGCCATTATCAAAAGAAAAGATAGTTGCATTAAGAGAAATCTGTGAAAAGATGGAAAAGGATGGTCAGTTGGAGGAAGCTCCCCCGACCAATCCATACAACACCCCCACATTTGCTATAAAGAAAAAGGATAAGAACAAATGGAGAATGCTGATAGATTTTAGGGAACTAAATAGGGTCACTCAGGACTTTACGGAAGTCCAATTAGGAATACCACACCCTGCAGGACTAGCAAAAAGGAAAAGAATTACAGTACTGGATATAGGTGATGCATATTTCTCCATACCTCTAGATGAAGAATTTAGGCAGTACACTGCCTTTACTTTACCATCAGTAAATAATGCAGAGCCAGGAAAACGATACATTTATAAGGTTCTGCCTCAGGGATGGAAGGGGTCACCAGCCATCTTCCAATACACTATGAGACATGTGCTAGAACCCTTCAGGAAGGCAAATCCAGATGTGACCTTAGTCCAGTATATGGATGACATCTTAATAGCTAGTGACAGGACAGACCTGGAACATGACAGGGTAGTTTTACAGTCAAAGGAACTCTTGAATAGCATAGGGTTTTCTACCCCAGAAGAGAAATTCCAAAAAGATCCCCCATTTCAATGGATGGGGTACGAATTGTGGCCAACAAAATGGAAGTTGCAAAAGATAGAGTTGCCACAAAGAGAGACCTGGACAGTGAATGATATACAGAAGTTAGTAGGAGTATTAAATTGGGCAGCTCAAATTTATCCAGGTATAAAAACCAAACATCTCTGTAGGTTAATTAGAGGAAAAATGACTCTAACAGAGGAAGTTCAGTGGACTGAGATGGCAGAAGCAGAATATGAGGAAAATAAAATAATTCTCAGTCAGGAACAAGAAGGATGTTATTACCAAGAAGGCAAGCCATTAGAAGCCACGGTAATAAAGAGTCAGGACAATCAGTGGTCTTATAAAATTCACCAAGAAGACAAAATACTGAAAGTAGGAAAATTTGCAAAGATAAAGAATACACATACCAATGGAGTGAGACTATTAGCACATGTAATACAGAAAATAGGAAAGGAAGCAATAGTGATCTGGGGACAGGTCCCAAAATTCCACTTACCAGTTGAGAAGGATGTATGGGAACAGTGGTGGACAGACTATTGGCAGGTAACCTGGATACCGGAATGGGATTTTATCTCAACACCACCGCTAGTAAGATTAGTCTTCAATCTAGTGAAGGACCCTATAGAGGGAGAAGAAACCTATTATACAGATGGATCATGTAATAAACAGTCAAAAGAAGGGAAAGCAGGATATATCACAGATAGGGGCAAAGACAAAGTAAAAGTGTTAGAACAGACTACTAATCAACAAGCAGAATTGGAAGCATTTCTCATGGCATTGACAGACTCAGGGCCAAAGGCAAATATTATAGTAGATTCACAATATGTTATGGGAATAATAACAGGATGCCCTACAGAATCAGAGAGCAGGCTAGTTAATCAAATAATAGAAGAAATGATTAAAAAGTCAGAAATTTATGTAGCATGGGTACCAGCACACAAAGGTATAGGAGGAAACCAAGAAATAGACCACCTAGTTAGTCAAGGGATTAGACAAGTTCTCTTCTTGGAAAAGATAGAGCCAGCACAAGAAGAACATGATAAATACCATAGTAATGTAAAAGAATTGGTATTCAAATTTGGATTACCCAGAATAGTGGCCAGACAGATAGTAGACACCTGTGATAAATGTCATCAGAAAGGAGAGGCTATACATGGGCAGGCAAATTCAGATCTAGGGACTTGGCAAATGGATTGTACCCATCTAGAGGGAAAAATAATCATAGTTGCAGTACATGTAGCTAGTGGATTCATAGAAGCAGAGGTAATTCCACAAGAGACAGGAAGACAGACAGCACTATTTCTGTTAAAATTGGCAGGCAGATGGCCTATTACACATCTACACACAGATAATGGTGCTAACTTTGCTTCGCAAGAAGTAAAGATGGTTGCATGGTGGGCAGGGATAGAGCACACCTTTGGGGTACCATACAATCCACAGAGTCAGGGAGTAGTGGAAGCAATGAATCACCACCTGAAAAATCAAATAGATAGAATCAGGGAACAAGCAAATTCAGTAGAAACCATAGTATTAATGGCAGTTCATTGCATGAATTTTAAAAGAAGGGGAGGAATAGGGGATATGACTCCAGCAGAAAGATTAATTAACATGATCACTACAGAACAAGAGATACAATTTCAACAATCAAAAAACTCAAAATTTAAAAATTTTCGGGTCTATTACAGAGAAGGCAGAGATCAACTGTGGAAGGGACCCGGTGAGCTATTGTGGAAAGGGGAAGGAGCAGTCATCTTAAAGGTAGGGACAGACATTAAGGTAGTACCCAGAAGAAAGGCTAAAATTATCAAAGATTATGGAGGAGGAAAAGAGGTGGATAGCAGTTCCCACATGGAGGATACCGGAGAGGCTAGAGAGGTGGCATAGCCTCATAAAATATCTGAAATATAAAACTAAAGATCTACAAAAGGTTTGCTATGTGCCCCATTTTAAGGTCGGATGGGCATGGTGGACCTGCAGCAGAGTAATCTTCCCACTACAGGAAGGAAGCCATTTAGAAGTACAAGGGTATTGGCATTTGACACCAGAAAAAGGGTGGCTCAGTACTTATGCAGTGAGGATAACCTGGTACTCAAAGAACTTTTGGACAGATGTAACACCAAACTATGCAGACATTTTACTGCATAGCACTTATTTCCCTTGCTTTACAGCGGGAGAAGTGAGAAGGGCCATCAGGGGAGAACAACTGCTGTCTTGCTGCAGGTTCCCGAGAGCTCATAAGTACCAGGTACCAAGCCTACAGTACTTAGCACTGAAAGTAGTAAGCGATGTCAGATCCCAGGGAGAGAATCCCACCTGGAAACAGTGGAGAAGAGACAATAGGAGAGGCCTTCGAATGGCTAAACAGAACAGTAGAGGAGATAAACAGAGAGGCGGTAAACCACCTACCAAGGGAGCTAATTTTCCAGGTTTGGCAAAGGTCTTGGGAATACTGGCATGATGAACAAGGGATGTCACCAAGCTATGTAAAATACAGATACTTGTGTTTAATACAAAAGGCTTTATTTATGCATTGCAAGAAAGGCTGTAGATGTCTAGGGGAAGGACATGGGGCAGGGGGATGGAGACCAGGACCTCCTCCTCCTCCCCCTCCAGGACTAGCATAAATGGAAGAAAGACCTCCAGAAAATGAAGGACCACAAAGGGAACCATGGGATGAATGGGTAGTGGAGGTTCTGGAAGAACTGAAAGAAGAAGCTTTAAAACATTTTGATCCTCGCTTGCTAACTGCACTTGGTAATCATATCTATAATAGACATGGAGACACCCTTGAGGGAGCAGGAGAACTCATTAGAATCCTCCAACGAGCGCTCTTCATGCATTTCAGAGGCGGATGCATCCACTCCAGAATCGGCCAACCTGGGGGAGGAAATCCTCTCTCAGCTATACCGCCCTCTAGAAGCATGCTATAACACATGCTATTGTAAAAAGTGTTGCTACCATTGCCAGTTTTGTTTTCTTAAAAAAGGCTTGGGGATATGTTATGAGCAATCACGAAAGAGAAGAAGAACTCCGAAAAAGGCTAAGGCTAATACATCTTCTGCATCAAACAAGTAAGTATGGGATGTCTTGGGAATCAGCTGCTTATCGCCATCTTGCTTTTAAGTGTCTATGGGATCTATTGTACTCTATATGTCACAGTCTTTTATGGTGTACCAGCTTGGAGGAATGCGACAATTCCCCTCTTTTGTGCAACCAAGAATAGGGATACTTGGGGAACAACTCAGTGCCTACCAGATAATGGTGATTATTCAGAAGTGGCCCTTAATGTTACAGAAAGCTTTGATGCCTGGAATAATACAGTCACAGAACAGGCAATAGAGGATGTATGGCAACTCTTTGAGACCTCAATAAAGCCTTGTGTAAAATTATCCCCATTATGCATTACTATGAGATGCAATAAAAGTGAGACAGATAGATGGGGATTGACAAAATCAATAACAACAACAGCATCAACAACATCAACGACAGCATCAGCAAAAGTAGACATGGTCAATGAGACTAGTTCTTGTATAGCCCAGGATAATTGCACAGGCTTGGAACAAGAGCAAATGATAAGCTGTAAATTCAACATGACAGGGTTAAAAAGAGACAAGAAAAAAGAGTACAATGAAACTTGGTACTCTGCAGATTTGGTATGTGAACAAGGGAATAACACTGGTAATGAAAGTAGATGTTACATGAACCACTGTAACACTTCTGTTATCCAAGAGTCTTGTGACAAACATTATTGGGATGCTATTAGATTTAGGTATTGTGCACCTCCAGGTTATGCTTTGCTTAGATGTAATGACACAAATTATTCAGGCTTTATGCCTAAATGTTCTAAGGTGGTGGTCTCTTCATGCACAAGGATGATGGAGACACAGACTTCTACTTGGTTTGGCTTTAATGGAACTAGAGCAGAAAATAGAACTTATATTTACTGGCATGGTAGGGATAATAGGACTATAATTAGTTTAAATAAGTATTATAATCTAACAATGAAATGTAGAAGACCAGGAAATAAGACAGTTTTACCAGTCACCATTATGTCTGGATTGGTTTTCCACTCACAACCAATCAATGATAGGCCAAAGCAGGCATGGTGTTGGTTTGGAGGAAAATGGAAGGATGCAATAAAAGAGGTGAAGCAGACCATTGTCAAACATCCCAGGTATACTGGAACTAACAATACTGATAAAATCAATTTGACGGCTCCTGGAGGAGGAGATCCGGAAGTTACCTTCATGTGGACAAATTGCAGAGGAGAGTTCCTCTACTGTAAAATGAATTGGTTTCTAAATTGGGTAGAAGATAGGAATACAGCTAACCAGAAGCCAAAGGAACAGCATAAAAGGAATTACGTGCCATGTCATATTAGACAAATAATCAACACTTGGCATAAAGTAGGCAAAAATGTTTATTTGCCTCCAAGAGAGGGAGACCTCACGTGTAACTCCACAGTGACCAGTCTCATAGCAAACATAGATTGGATTGATGGAAACCAAACTAATATCACCATGAGTGCAGAGGTGGCAGAACTGTATCGATTGGAATTGGGAGATTATAAATTAGTAGAGATCACTCCAATTGGCTTGGCCCCCACAGATGTGAAGAGGTACACTACTGGTGGCACCTCAAGAAATAAAAGAGGGGTCTTTGTGCTAGGGTTCTTGGGTTTTCTCGCAACGGCAGGTTCTGCAATGGGCGCGGCGTCGTTGACGCTGACCGCTCAGTCCCGAACTTTATTGGCTGGGATAGTGCAGCAACAGCAACAGCTGTTGGACGTGGTCAAGAGACAACAAGAATTGTTGCGACTGACCGTCTGGGGAACAAAGAACCTCCAGACTAGGGTCACTGCCATCGAGAAGTACTTAAAGGACCAGGCGCAGCTGAATGCTTGGGGATGTGCGTTTAGACAAGTCTGCCACACTACTGTACCATGGCCAAATGCAAGTCTAACACCAAAGTGGAACAATGAGACTTGGCAAGAGTGGGAGCGAAAGGTTGACTTCTTGGAAGAAAATATAACAGCCCTCCTAGAGGAGGCACAAATTCAACAAGAGAAGAACATGTATGAATTACAAAAGTTGAATAGCTGGGATGTGTTTGGCAATTGGTTTGACCTTGCTTCTTGGATAAAGTATATACAATATGGAGTTTATATAGTTGTAGGAGTAATACTGTTAAGAATAGTGATCTATATAGTACAAATGCTAGCTAAGTTAAGGCAGGGGTATAGGCCAGTGTTCTCTTCCCCACCCTCTTATTTCCAGCAGACCCATATCCAACAGGACCCGGCACTGCCAACCAGAGAAGGCAAAGAAAGAGACGGTGGAGAAGGCGGTGGCAACAGCTCCTGGCCTTGGCAGATAGAATATATTCATTTCCTGATCCGCCAACTGATACGCCTCTTGACTTGGCTATTCAGCAACTGCAGAACCTTGCTATCGAGAGTATACCAGATCCTCCAACCAATACTCCAGAGGCTCTCTGCGACCCTACAGAGGATTCGAGAAGTCCTCAGGACTGAACTGACCTACCTACAATATGGGTGGAGCTATTTCCATGAGGCGGTCCAGGCCGTCTGGAGATCTGCGACAGAGACTCTTGCGGGCGCGTGGGGAGACTTATGGGAGACTCTTAGGAGAGGTGGAAGATGGATACTCGCAATCCCCAGGAGGATTAGACAAGGGCTTGAGCTCACTCTCTTGTGAGGGACAGAAATACAATCAGGGACAGTATATGAATACTCCATGGAGAAACCCAGCTGAAGAGAGAGAAAAATTAGCATACAGAAAACAAAATATGGATGATATAGATGAGgAAGATGATGACTTGGTAGGGGTATCAGTGAGGCCAAAAGTTCCCCTAAGAACAATGAGTTACAAATTGGCAATAGACATGTCTCATTTTATAAAAGAAAAGGGGGGACTGGAAGGGATTTATTACAGTGCAAGAAGACATAGAATCTTAGACATATACTTAGAAAAGGAAGAAGGCATCATACCAGATTGGCAGGATTACACCTCAGGACCAGGAATTAGATACCCAAAGACATTTGGCTGGCTATGGAAATTAGTCCCTGTAAATGTATCAGATGAGGCACAGGAGGATGAGGAGCATTATTTAATGCATCCAGCTCAAACTTCCCAGTGGGATGACCCTTGGGGAGAGGTTCTAGCATGGAAGTTTGATCCAACTCTGGCCTACACTTATGAGGCATATGTTAGATACCCAGAAGAGTTTGGAAGCAAGTCAGGCCTGTCAGAGGAAGAGGTTAGAAGAAGGCTAACCGCAAGAGGCCTTCTTAACATGGCTGACAAGAAGGAAACTCGCTGAAACAGCAGGGACTTTCCACAAGGGGATGTTACGGGGAGGTACTGGGGAGGAGCCGGTCGGGAACGCCCACTTTCTTGATGTATAAATATCACTGCATTTCGCTCTGTATTCAGTCGCTCTGCGGAGAGGCTGGCAGATTGAGCCCTGGGAGGTTCTCTCCAGCACTAGCAGGTAGAGCCTGGGTGTTCCCTGCTAGACTCTCACCAGCACTTGGCCGGTGCTGGGCAGAGTGACTCCACGCTTGCTTGCTTAAAGCCCTCTTCAATAAAGCTGCCATTTTAGAAGTAAGCTAGTGTGTGTTCCCATCTCTCCTAGCCGCCGCCTGGTCAACTCGGTACTCAATAATAAGAAGACCCTGGTCTGTTAGGACCCTTTCTGCTTTGGGAAACCGAAGCAGGAAAATCCCTAGCA'),
('SIVmac251', 'Virus', 'SIVmac251', 'RNA', 'SIV', 'TGGAAGGGATTTATTACAGTGCAAGAAGACATAGAATCTTAGACATGTACTTAGAAAAGGAAGAAGGCATCATACCAGATTGGCAGGATTACACCTCAGGACCAGGAATTAGATACCCAAAGACATTTGGCTGGCTATGGAAATTAGTCCCTGTAAATGTATCAGATGAGGCACAGGAGGATGAGAGGCATTATTTAATGCAGCCAGCTCAAACTTCCAAGTGGGATGACCCTTGGGGAGAGGTTCTAGCGTGGAAGTTTGATCCAACTCTAGCCTACACTTATGAGGCATATGCTAGATACCCAGAAGAGTTGGAAGCAAGTCAGGCCTGTCAGAGGAAGAGGTTAGAAGAAGGCTAACCGCAAGAGGCCTTCTTAACATGGCTGACAAGAGGGAAACTCGCTGAGATAGCAGGGACTTTCCACAAGGGGATGTTATGGGGAGGAGCCGGTCGGGAACACCCACTTTCTTGATGTATAAATATCACTGCATTTCGCTCTGTATTCAGTCGCTCTGCGGAGAGGCTGGCAGATTGAGCCCTGGGAGGTTCTCTCCAGCACTAGCAGGTAGAGCCTGGGTGTTCCCTGCTAGACTCTCACCAGCACTTGGCCAGTGCTGGGCAGAGTGGCTCCACGCTTGCTTGCTTAAAGACCTCTTCAATAAAGCTGCCATTTTAGAAGTAAGCCAGTGTGTGTTCCCATCTCTCCTAGTCGCCGCCTGGTCAACTCGGTACTCGGTAATAAGAAGACCCTGGTCTGTTAGGACCCTTTCTGCTTTGAGAAACCGAAGCAGGAAAATCCCTAGCAGATTGGCGCCCGAACAGGACTTGAAGGAGAGTGAGAGACTCCTGAGTACGGCTGAGTGAAGGCAGTAAGGGCGGCAGGAACCAACCACGACGGAGTGCTCCTATAAAGGCGCGGGTCGGTACCAGACGGCGTGAGGAGCGGGAGAGGAGGAGGCCTCCGGTTGCAGGTAAGTGCAACACAAAAAAGAAATAGCTGTCTTGTTATCCAGGAAGGGATAATAAGATAGAGTGGGAGATGGGCGCGAGAAACTCCGTCTTGTCAGGGAAGAAAGCAGATGAATTAGAAAAAATTAGGCTACGACCCGGCGGAAAGAAAAAGTACATGTTGAAGCATGTAGTATGGGCAGCAAATGAATTAGATAGATTTGGATTAGCAGAAAGCCTGTTGGAGAACAAAGAAGGATGTCAAAAAATACTTTCGGTCTTAGCTCCATTAGTGCCAACAGGCTCAGAAAATTTAAAAAGCCTTTATAATACTGTCTGCGTCATCTGGTGCATTCACGCAGAAGAGAAAGTGAAACACACTGAGGAAGCAAAACAGATAGTGCAGAGACACCTAGTGGTGGAAACAGGAACAGCAGAAACTATGCCAAAAACAAGTAGACCAACAGCACCATCTAGCGGCAGAGGAGGAAATTACCCAGTACAACAAATAGGTGGTAACTATGTCCACCTGCCATTAAGCCCGAGAACATTAAATGCCTGGGTAAAATTGATAGAGGAAAAGAAATTTGGAGCAGAAGTAGTGCCAGGATTTCAGGCACTGTCAGAAGGCTGCACCCCCTATGACATTAATCAGATGTTAAATTGTGTGGGAGACCATCAAGCGGCTATGCAGATTATCAGAGATATTATAAATGAGGAGGCTGCAGATTGGGACTTGCAGCACCCACAACCAGCTCCACAACAAGGACAGCTTAGGGAGCCGTCAGGATCAGATATTGCAGGAACAACTAGTTCAGTAGATGAACAAATCCAGTGGATGTACAGACAACAGAACCCCATACCAGTAGGCAACATTTACAGGAGATGGATCCAACTGGGGTTGCAAAAATGTGTCAGAATGTATAACCCAACAAACATTCTAGATGTAAAACAAGGGCCAAAAGAGCCATTTCAGAGCTATGTAGACAGGTTCTACAAAAGCTTAAGAGCAGAACAAACAGATGCAGCAGTAAAGAATTGGATGACTCAAACACTGCTGATTCAAAATGCTAACCCAGATTGCAAGCTAGTGCTGAAGGGGCTGGGTGTGAATCCCACCCTAGAAGAAATGCTGACGGCTTGTCAAGGAGTAGGGGGACCAGGACAGAAGGCTAGATTAATGGCAGAAGCCCTGAAAGAGGCCCTCGCACCAGTGCCAATCCCTTTTGCAGCAGCCCAGAAGAGGGGACCAAGAAAGCCAATTAAGTGTTGGAATTGTGGGAAGGAGGGACACTCTGCAAGGCAATGCAGAGCCCCAAGAAGACAGGGATGCTGGAAATGTGGAAAAATGGACCATGTTATGGCCAAATGCCCAGACAGACAGGCGGGTTTTTTAGGCCTTGGTCCATGGGGAAAGAAGCCCCGCAATTTCCCCATGGCTCAAGTGCATCAGGGGCTGACGCCAACTGCTCCCCCAGAGGACCCAGCTGTGGATCTGCTAAAGAACTACATGCAGTTGGGCAAGCAGCAGAGAGAAAGCAGAGAGAAGCCTTACAAGGAGGTGACAGAGGATTTGCTGCACCTCAATTCTCTCTTTGGAGGAGACCAGTAGTCACTGCTCATATTGAAGGACAGCCTGTAGAAGTATTATTGGATACAGGGGCTGATGATTCTATTGTAACAGGAATAGAGTTAGGTCCACATTATACCCCAAAAATAGTAGGAGGAATAGGAGGTTTTATTAATACTAAAGAATACAAAAATGTAAAAATAGAAGTTTTAGGCAAAAGGATTAAAGGGACAATCATGACAGGGGACACTCCGATTAACATTTTTGGTAGGAATTTGCTAACAGCTCTGGGGATGTCTCTAAATCTTCCCATAGCTAAGGTAGAGCCTGTAAAAGTCACCTTAAAGCCAGGAAAGGTTGGACCAAAATTGAAGCAGTGGCCATTATCAAAAGAAAAGATAGTTGCATTAAGAGAAATCTGTGAAAAGATGGAAAAGGATGGTCAGTTGGAGGAAGCTCCCCCGACCAATCCATACAACACCCCCACATTTGCCATAAAGAAAAAAGATAAGAACAAATGGAGAATGCTGATAGATTTTAGGGAACTAAATAGGGTCACTCAGGACTTTACAGAAGTCCAATTAGGAATACCACACCCTGCAGGACTAGCAAAAAGGAAAAGGATTACAGTACTGGATATAGGTGATGCATATTTCTCCATACCTCTAGATGAAGAATTTAGGCAGTACACTGCCTTTACTTTACCATCAGTAAATAATGCAGAGCCAGGAAAACGATACATTTATAAGGTTCTGCCTCAGGGATGGAAGGGGTCACCAGCCATCTTCCAATACACTATGAGACATGTGCTAGAACCCTTCAGGAAGGCAAATCCAGATGTGACCTTAGTCCAGTATATGGATGACATCTTAATAGCTAGTGACAGGACAGACCTGGAACATGACAGGGTAGTTTTACAGCTAAAGGAACTCTTAAATAGCATAGGGTTCTCTACCCCAGAAGAGAAATTCCAAAAAGATCCCCCATTTCAATGGATGGGGTACGAATTGTGGCCGACAAAATGGAAGTTGCAAAAGATAGAGTTGCCACAAAGAGAGACCTGGACAGTGAATGATATACAGAAGTTAGTAGGAGTATTAAATTGGGCAGCTCAAATTTATCCAGGTATAAAAACCAAACATCTCTGTAGGTTAATTAGAGGAAAAATGACTCTAACAGAGGAAGTTCAGTGGACTGAGATGGCAGAAGCAGAATATGAGGAAAATAAGATAATTCTCAGTCAGGAACAAGAAGGATGTTATTACCAAGAAGGCAAGCCATTAGAAGCCACGGTAATAAAGAGTCAGGACAATCAGTGGTCTTATAAAATTCACCAAGAAGACAAAATACTGAAAGTAGGAAAATTTGCAAAGATAAAGAATACACATACCAATGGAGTTAGACTATTAGCACATGTAATACAGAAAATAGGAAAGGAAGCAATAGTGATCTGGGGACAGGTCCCAAAATTCCACTTACCAGTTGAGAGGGATGTATGGGAACAGTGGTGGACAGACTATTGGCAGGTAACCTGGATACCGGAGTGGGATTTTATCTCAACGCCACCACTAGTAAGATTAGTCTTCAATCTAGTGAAGGACCCTATAGAGGGAGAAGAAACCTATTATACAGATGGATCATGTAATAAACAGTCAAAAGAAGGGAAAGCAGGATATATCACAGATAGGGGCAAAGACAAAGTAAAAGTGTTAGAACAGACTACTAATCAACAAGCAGAATTAGAAGCATTTCTCATGGCATTGACAGACTCAGGGCCAAAGACAAATATTATAGTAGATTCACAATATGTTATGGGAATAATAACAGGATGCCCTACAGAATCAGAGAGCAGGCTAGTTAACCAAATAATAGAAGAAATGATTAAAAAGTCAGAAATTTATGTAGCATGGGTACCAGCACACAAAGGTATAGGAGGAAACCAAGAAATAGACCACCTAGTTAGTCAGGGGATTAGACAAGTTCTCTTCTTGGAAAAGATAGAGCCAGCACAAGAAGAACATGATAAATACCATAGTAATGTAAAAGAATTGGTATTCAAATTTGGATTACCCAGAATAGTGGCCAGACAGATAGTAGACACCTGTGATAAATGTCATCAGAAAGGAGAAGCTATACATGGGCAGGTAAATTCAGATCTAGGGACTTGGCAAATGGACTGTACCCATCTAGAAGGAAAAATAGTCATAGTTGCAGTACATGTAGCTAGTGGATTCATAGAAGCAGAAGTAATTCCACAAGAGACAGGAAGACAGACAGCACTATTTCTGTTAAAATTGGCAGGCAGATGGCCTATTACACATCTACACACAGATAATGGTGCTAACTTTGCCTCGCAAGAAGTAAAGATGGTTGCATGGTGGGCAGGGATAGAGCACACCTTTGGGGTACCATACAATCCACAGAGTCAGGGAGTAGTGGAAGCAATGAATCACCACCTGAAAAATCAAATAGATAGAATCAGGGAACAAGCAAATTCAGTAGAAACCATAGTATTAATGGCAGTTCATTGCATGAATTTTAAAAGAAGGGGAGGAATAGGGGATATGACTCCAGCAGAAAGATTAATTAACATGATCACTACAGAACAAGAAATACAATTTCAACAATCAAAAAACTCAAAATTTAAAAATTTTCGGGTCTATTACAGAGAAGGCAGAGATCAACTGTGGAAGGGACCCGGTGAGCTATTGTGGAAAGGGGAAGGAGCAGTCATCTTAAAGGTAGGGACAGACATTAAGGTAGTACCCAGAAGAAAGGCTAAAATTATCAAAGATTATGGAGGAGGAAAAGAGGTGGATAGCAGTTCCCACATGGAGGATACCGGAGAGGCTAGAGAGGTGGCATAGCCTCATAAAATATCTGAAATATAAAACTAAAGATCTACAAAAGGTTTGCTATGTGCCCCATTTTAAGGTCGGATGGGCATGGTGGACCTGCAGCAGAGTAATCTTCCCCCTACAGGAAGGAAGCCATTTAGAAGTACAAGGGTATTGGCATTTGACACCAGAAAGAGGGTGGCTCAGTACTTATGCAGTGAGGATAACCTGGTACTCAAGGAACTTTTGGACAGATGTAACACCAGACTATGCAGACATTTTACTGCATAGCACTTATTTCCCTTGCTTTACAGCGGGAGAAGTGAGAAGGGCCATCAGGGGAGAACAACTGCTGTCTTGCTGCAAGTTCCCGAGAGCTCATAGGTACCAGGTACCAAGCCTACAGTACTTAGCACTAAAAGTAGTAAGCGATGTCAGATCCCAGGGAGAGAATCCCACCTGGAAACAGTGGAGAAGAGACAATAGGAGAGGCCTTCGAATGGCTAAACAGAACAGTAGAGGAGATAAACAGAGAGGCAGTAAACCACCTACCAAGGGAGCTGATTTTCCAGGTTTGGCAAAGGTCTTGGGAATACTGGCATGATGAACAAGGGATGTCACAAAGCTATGTAAAATACAGATACTTGTGTTTAATGCAAAAGGCTTTATTTATGCATTGCAAGAAAGGCTGTAGATGTCTAGGGGAAGGACACGGGGCAGGAGGATGGAGACCAGGACCTCCTCCTCCTCCCCCTCCAGGACTAGCATAAATGGAAGAAAGACCTCCAGAAAATGAAGGCCCACAAAGGGAACCATGGGATGAATGGGTAGTGGAGGTTCTGGAAGAATTGAAAGAAGAAGCTTTAAAACATTTTGATCCTCGCTTGCTAACTGCACTTGGTAATCATATCTATAATAGACATGGAGACACCCTTGAGGGAGCAGGAGAACTCATTAGAATCCTCCAACGAGCGCTCTTCATGCATTTTAGAGGCGGATGCAACCACTCCAGAATCGGCCAACCTGGGGGAGGAAATCCTCTCTCAACTATACCGCCCTCTTGAGGCGTGCTATAACACATGCTATTGTAAAAAGTGTTGCTACCATTGCCAGTTTTGTTTTCTTAAAAAGGGATTGGGGATATGTTATGAGCAGTCACGAAAGAGAAGAAGAACTCCGAAAAAGGCTAAGGCTAATACATCTTCTGCATCAAACAAGTAAGTATGGGATGTCTTGGGAATCAGCTGCTTATCGCCATCTTGCTTTTAAGTGTCTATGGGATCTATTGTACTCAATATGTCACAGTCTTTTATGGTGTACCAGCTTGGAGGAATGCGACAATTCCCCTCTTCTGTGCAACCAAGAATAGGGATACTTGGGGAACAACTCAGTGCCTACCAGATAATGGTGATTATTCAGAATTGGCCCTTAATGTTACAGAAAGCTTTGATGCTTGGGAGAATACAGTCACAGAACAGGCAATAGAGGACGTATGGCAACTCTTTGAGACCTCAATAAAGCCTTGTGTAAAATTATCCCCATTATGCATTACTATGAGATGCAATAAAAGTGAGACAGATAGATGGGGATTGACAAAATCATCAACAACAATAACAACAGCAGCACCAACATCAGCACCAGTATCAGAAAAAATAGACATGGTCAATGAGACTAGTTCTTGTATAGCTCAGAATAATTGCACAGGCTTGGAACAAGAGCAAATGATAAGCTGTAAATTCACCATGACAGGGTTAAAAAGAGACAAGACAAAGGAGTACAATGAAACTTGGTACTCTACAGATTTGGTTTGTGAACAAGGGAATAGCACTGATAATGAAAGCAGATGCTACATGAATCACTGTAACACTTCTGTTATCCAAGAATCTTGTGACAAACATTATTGGGATACTATTAGATTTAGGTATTGTGCACCTCCAGGTTATGCTTTGCTTAGATGTAATGACACAAATTATTCAGGCTTTATGCCTAAATGTTCTAAGGTGGTGGTCTCTTCATGCACAAGGATGATGGAGACACAGACTTCTACTTGGTTTGGCTTTAATGGAACTAGAGCAGAAAATAGAACTTATATTTACTGGCATGGTAGGGATAATAGGACTATAATTAGTTTAAATAAGTATTATAATCTAACAATGAAATGTAGAAGACCAGGAAATAAGACAGTTTTACCAGTCACCATTATGTCTGGATTGGTTTTCCACTCACAACCAATCAATGATAGGCCAAAGCAGGCATGGTGTTGGTTTGGAGGAAAATGGAAGGATGCAATAAAAGAGGTGAAACAGACCATTGTCAAACATCCCAGGTATACTGGAACTAACAATACTGATAAAATCAATTTAACGGCTCCTGGAGGAGGAGATCCGGAAGTTACCTTCATGTGGACAAATTGCAGAGGAGAGTTCCTCTACTGTAAAATGAATTGGTTTCTAAATTGGGTAGAGGATAGGGATGTAACTACCCAGAGGCCAAAGGAACGGCATAGAAGGAATTACGTGCCGTGTCATATTAGACAAATAATCAACACTTGGCATAAAGTAGGCAAAAATGTTTATTTGCCTCCAAGAGAGGGAGACCTCACGTGTAACTCCACAGTGACCAGTCTCATAGCAAACATAGATTGGACTGATGGAAACCAAACTAGTATCACCATGAGTGCAGAGGTGGCAGAACTGTATCGATTGGAGTTGGGAGATTATAAATTAGTAGAGATCACTCCGATTGGCTTGGCCCCCACAGATGTGAAGAGGTACACTACTGGTGGCACCTCAAGAAATAAAAGAGGGGTCTTTGTGCTAGGGTTCTTGGGTTTTCTCGCAACGGCAGGTTCTGCAATGGGCGCGGCGTCGTTGACGCTGACCGCTCAGTCCCGGACTTTATTGGCTGGGATAGTGCAGCAACAGCAACAGCTGTTGGACGTGGTCAAGAGACAACAAGAATTGTTGCGACTGACCGTCTGGGGAACAAAGAACCTCCAGACTAGGGTCACTGCCATCGAGAAGTACTTAAAGGACCAGGCGCAGCTAAATGCTTGGGGATGTGCGTTTAGACAAGTCTGCCACACTACTGTACCATGGCCAAATGCAAGTCTAACACCAGACTGGAACAATGATACTTGGCAAGAGTGGGAGCGAAAGGTTGACTTCTTGGAGGAAAATATAACAGCCCTCCTAGAAGAGGCACAAATTCAACAAGAGAAGAACATGTATGAATTACAAAAGTTGAATAGCTGGGATGTGTTTGGCAATTGGTTTGACCTTGCTTCTTGGATAAAGTATATACAATATGGAATTTATGTAGTTGTAGGAGTAATACTGTTAAGAATAGTGATCTATATAGTACAAATGCTAGCTAAGTTAAGGCAGGGGTATAGGCCAGTGTTCTCTTCCCCACCCTCTTATTTCCAGTAGACTCATACCCAACAGGACCCGGCACTGCCAACCAGAGAAGGCAAAGAAGGAGACGGTGGAGAAGGCGGTGGCAACAGCTCCTGGCCTTGGCAGATAGAATATATTCATTTCCTGATCCGCCAACTGATACGCCTCTTGACTTGGCTATTCAGCAACTGCAGAACCTTGCTATCGAGAGCATACCAGATCCTCCAACCAATACTCCAGAGGCTCTCTGCGACCCTACGAAGGGTTCGAGAAGTCCTCAGGACTGAACTGACCTACCTACAATATGGGTGGAGCTATTTCCATGAGGCGGTCCAAGCCGGCTGGAGATCTGCGACAGAAACTCTTGCGGGCGCGTGGAGAGACTTATGGGAGACTCTTAGGAGAGGTGGAAGATGGATCCTCGCAATCCCTAGGAGGATTAGGCAAGGGCTTGAGCTCACGCTCTTGTGAGGGACAGAAATACAATCAGGGGCAGTATATGAATACTCCATGGAGAAACCCAGCTGAAGAAAAAGAAAAATTAGCATACAGAAAACAAAATATGGATGATATAGATGAGGAAGATGATGACTTGGTAGGGGTATCAGTGAGGCCAAAAGTTCCCCTAAGAGCAATGACTTACAAATTGGCAATAGATATGTCTCATTTTATAAAAGAAAAGGGGGGACTGGAAGGGATTTATTACAGTGCAAGAAGACATAGAATCTTAGACATGTACTTAGAAAAGGAAGAAGGCATCATACCAGATTGGCAGGATTACACCTCAGGACCAGGAATTAGATACCCAAAGACATTTGGCTGGCTATGGAAATTAGTCCCTGTAAATGTATCAGATGAGGCACAGGAGGATGAGAGGCATTATTTAATGCAGCCAGCTCAAACTTCCAAGTGGGATGACCCTTGGGGAGAGGTTCTAGCGTGGAAGTTTGATCCAACTCTAGCCTACACTTATGAGGCATATGCTAGATACCCAGAAGAGTTGGAAGCAAGTCAGGCCTGTCAGAGGAAGAGGTTAGAAGAAGGCTAACCGCAAGAGGCCTTCTTAACATGGCTGACAAGAGGGAAACTCGCTGAGATAGCAGGGACTTTCCACAAGGGGATGTTATGGGGAGGAGCCGGTCGGGAACACCCACTTTCTTGATGTATAAATATCACTGCATTTCGCTCTGTATTCAGTCGCTCTGCGGAGAGGCTGGCAGATTGAGCCCTGGGAGGTTCTCTCCAGCACTAGCAGGTAGAGCCTGGGTGTTCCCTGCTAGACTCTCACCAGCACTTGGCCAGTGCTGGGCAGAGTGGCTCCACGCTTGCTTGCTTAAAGACCTCTTCAATAAAGCTGCCATTTTAGAAGTAAGCCAGTGTGTGTTCCCATCTCTCCTAGTCGCCGCCTGGTCAACTCGGTACTCGGTAATAAGAAGACCCTGGTCTGTTAGGACCCTTTCTGCTTTGAGAAACCGAAGCAGGAAAATCCCTAGCATGAAGATGGACTAATATAGGAGAGACCT'),
('SHIV89.6P', 'Virus', 'SHIV89.6P', 'RNA', 'SIV', 'CAGTCGCTCTGCGGAGAGGCTGGCAGATTGAGCCCTGGGAGGTTCTCTCCAGCACTAGCAGGTAGAGCCTGGGTGTTCCCTGCTAGACTCTCACCAGCACTTGGCCGGTGCTGGGCAGAGTGACTCCACGCTTGTTTGCTTAAAGCCCTCTTCAATAAAGCTGCCATTTTAGAAGTAAGCTAGTGTGTGTTCCCATCTCTCCTAGCCGCCGCCTGGTCAACTCGGTACTCAATAATAAGAAGACCCTGGTCTGTTAGGACCCTTTCTGCTTTGGGAAACCGAAGCAGGAAAATCCCTAGCAGATTGGCGCCTGAACAGGGACTTGAAGGAGAGTGAGAGACTCCTGAGTACGGCTGAGTGAAGGCAGTAAGGGCGGCAGGAACCAACCACGACGGAGTGCTCCTATAAAGGCGCGGGTCGGTACCAGACGGCGTGAGGAGCGGGAGAGGAAGAGGCCTCCGGTTGCAGGTAAGTGCAACACAAAAAAGAAATAGCTGTCTTTTATCCAGGAAGGGGTAATAAGATAGAGTGGGAGATGGGCGTGAGAAACTCCGTCTTGTCAGGGAAGAAAGCAGATGAATTAGAAAAAATTAGGCTACGACCCAACGGAAAGAAAAAGTACATGTTGAAGCATGTAGTATGGGCAGCAAATGAATTAGATAGATTTGGATTAGCAGAAAGCCTGTTGGAGAACAAAGAAGGATGTCAAAAAATACTTTCGGTCTTAGCTCCATTAGTGCCAACAGGCTCAGAAAATTTAAAAAGCCTTTATAATACTGTCTGCGTCATCTGGTGCATTCACGCAGAAGAGAAAGTGAAACACACTGAGGAAGCAAAACAGATAGTGCAGAGACACCTAGTGGTGGAAACAGGAACAACAGAAACTATGCCAAAAACAAGTAGACCAACAGCACCATCTAGCGGCAGAGGAGGAAATTACCCAGTACAACAAATAGGTGGTAACTATGTCCACCTGCCATTAAGCCCGAGAACATTAAATGCCTGGGTAAAATTGATAGAGGAAAAGAAATTTGGAGCAGAAGTAGTGCCAGGATTTCAGGCACTGTCAGAAGGTTGCACCCCCTATGACATTAATCAGATGTTAAATTGTGTGGGAGACCATCAAGCGGCTATGCAGATTATCAGAGATATTATAAACGAGGAGGCTGCAGATTGGGACTTGCAGCACCCACAACCAGCTCCACAACAAGGACAACTTAGGGAGCCGTCAGGATCAGATATTGCAGGAACAACTAGTTCAGTAGATGAACAAATCCAGTGGATGTACAGACAACAGAACCCCATACCAGTAGGCAACATTTACAGGAGATGGATCCAACTGGGGTTGCAAAAATGTGTCAGAATGTATAACCCAACAAACATTCTAGATGTAAAACAAGGGCCAAAAGAGCCATTTCAGAGCTATGTAGACAGGTTCTACAAAAGTTTAAGAGCAGAACAGACAGATGCAGCAGTAAAGAATTGGATGACTCAAACACTGCTGATTCAAAATGCTAACCCAGATTGCAAGCTAGTGCTGAAGGGGCTGGGTGTGAATCCCACCCTAGAAGAAATGCTGACGGCTTGTCAAGGAGTAGGGGGGCCGGGACAGAAGGCTAGATTAATGGCAGAAGCCCTGAAAGAGGCCCTCGCACCAGTGCCAATCCCTTTTGCAGCAGCCCAACAGAGGGGACCAAGAAAGCCAATTAAGTGTTGGAATTGTGGGAAAGAGGGACACTCTGCAAGGCAATGCAGAGCCCCAAGAAGACAGGGATGCTGGAAATGTGGAAAAATGGACCATGTTATGGCCAAATGCCCAGACAGACAGGCGGGTTTTTTAGGCCTTGGTCCATGGGGAAAGAAGCCCCGCAATTTCCCCATGGCTCAAGTGCATCAGGGGCTGATGCCAACTGCTCCCCCAGAGGACCCAGCTGTGGATCTGCTAAAGAACTACATGCAGTTGGGCAAGCAGCAGAGAGAAAAGCAGAGAGAAAGCAGAGAGAAGCCTTACAAGGAGGTGACAGAGGATTTGCTGCACCTCAATTCTCTCTTTGGAGGAGACCAGTAGTCACTGCTCATATTGAAGGACAGCCTGTAGAAGTATTACTGGATACAGGGGCTGATGATTCTATTGTAACAGGAATAGAGTTAGGTCCACATTATACCCCAAAAATAGTAGGAGGAATAGGAGGTTTTATTAATACTAAAGAATACAAAAATGTAGAAATAGAAGTTTTAGGCAAAAGGATTAAAGGGACAATCATGACAGGGGACACCCCGATTAACATTTTTGGTAGAAATTTGCTAACAGCTCTGGGGATGTCTCTAAATTTTCCCATAGCTAAAGTAGAGCCTGTAAAAGTCGCCTTAAAGCCAGGAAAGGATGGACCAAAATTGAAGCAGTGGCCATTATCAAAAGAAAAGATAGTTGCATTAAGAGAAATCTGTGAAAAGATGGAAAAGGATGGTCAGTTGGAGGAAGCTCCCCCGACCAATCCATACAACACCCCCACATTTGCTATAAAGAAAAAGGATAAGAACAAATGGAGAATGCTGATAGATTTTAGGGAACTAAATAGGGTCACTCAGGACTTTACGGAAGTCCAATTAGGAATACCACACCCTGCAGGACTAGCAAAAAGGAAAAGAATTACAGTACTGGATATAGGTGATGCATATTTCTCCATACCTCTAGATGAAGAATTTAGGCAGTACACTGCCTTTACTTTACCATCAGTAAATAATGCAGAGCCAGGAAAACGATACATTTATAAGGTTCTGCCTCAGGGATGGAAGGGGTCACCAGCCATCTTCCAATACACTATGAGACATGTGCTAGAACCCTTCAGGAAGGCAAATCCAGATGTGACCTTAGTCCAGTATATGGATGACATCTTAATAGCTAGTGACAGGACAGACCTGGAACATGACAGGGTAGTTTTACAGTCAAAGGAACTCTTGAATAGCATAGGGTTTTCTACCCCAGAAGAGAAATTCCAAAAAGATCCCCCATTTCAATGGATGGGGTACGAATTGTGGCCAACAAAATGGAAGTTGCAAAAGATAGAGTTGCCACAAAGAGAGACCTGGACAGTGAATGATATACAGAAGTTAGTAGGAGTATTAAATTGGGCAGCTCAAATTTATCCAGGTATAAAAACCAAACATCTCTGTAGGTTAATTAGAGGAAAAATGACTCTAACAGAGGAAGTTCAGTGGACTGAGATGGCAGAAGCAGAATATGAGGAAAATAAAATAATTCTCAGTCAGGAACAAGAAGGATGTTATTACCAAGAAGGCAAGCCATTAGAAGCCACGGTAATAAAGAGTCAGGACAATCAGTGGTCTTATAAAATTCACCAAGAAGACAAAATACTGAAAGTAGGAAAATTTGCAAAGATAAAGAATACACATACCAATGGAGTGAGACTATTAGCACATGTAATACAGAAAATAGGAAAGGAAGCAATAGTGATCTGGGGACAGGTCCCAAAATTCCACTTACCAGTTGAGAAGGATGTATGGGAACAGTGGTGGACAGACTATTGGCAGGTAACCTGGATACCGGAATGGGATTTTATCTCAACACCACCGCTAGTAAGATTAGTCTTCAATCTAGTGAAGGACCCTATAGAGGGAGAAGAAACCTATTATACAGATGGATCATGTAATAAACAGTCAAAAGAAGGGAAAGCAGGATATATCACAGATAGGGGCAAAGACAAAGTAAAAGTGTTAGAACAGACTACTAATCAACAAGCAGAATTGGAAGCATTTCTCATGGCATTGACAGACTCAGGGCCAAAGGCAAATATTATAGTAGATTCACAATATGTTATGGGAATAATAACAGGATGCCCTACAGAATCAGAGAGCAGGCTAGTTAATCAAATAATAGAAGAAATGATTAAAAAGTCAGAAATTTATGTAGCATGGGTACCAGCACACAAAGGTATAGGAGGAAACCAAGAAATAGACCACCTAGTTAGTCAAGGGATTAGACAAGTTCTCTTCTTGGAAAAGATAGAGCCAGCACAAGAAGAACATGATAAATACCATAGTAATGTAAAAGAATTGGTATTCAAATTTGGATTACCCAGAATAGTGGCCAGACAGATAGTAGACACCTGTGATAAATGTCATCAGAAAGGAGAGGCTATACATGGGCAGGCAAATTCAGATCTAGGGACTTGGCAAATGGATTGTACCCATCTAGAGGGAAAAATAATCATAGTTGCAGTACATGTAGCTAGTGGATTCATAGAAGCAGAGGTAATTCCACAAGAGACAGGAAGACAGACAGCACTATTTCTGTTAAAATTGGCAGGCAGATGGCCTATTACACATCTACACACAGATAATGGTGCTAACTTTGCTTCGCAAGAAGTAAAGATGGTTGCATGGTGGGCAGGGATAGAGCACACCTTTGGGGTACCATACAATCCACAGAGTCAGGGAGTAGTGGAAGCAATGAATCACCACCTGAAAAATCAAATAGATAGAATCAGGGAACAAGCAAATTCAGTAGAAACCATAGTATTAATGGCAGTTCATTGCATGAATTTTAAAAGAAGGGGAGGAATAGGGGATATGACTCCAGCAGAAAGATTAATTAACATGATCACTACAGAACAAGAGATACAATTTCAACAATCAAAAAACTCAAAATTTAAAAATTTTCGGGTCTATTACAGAGAAGGCAGAGATCAACTGTGGAAGGGACCCGGTGAGCTATTGTGGAAAGGGGAAGGAGCAGTCATCTTAAAGGTAGGGACAGACATTAAGGTAGTACCCAGAAGAAAGGCTAAAATTATCAAAGATTATGGAGGAGGAAAAGAGGTGGATAGCAGTTCCCACATGGAGGATACCGGAGAGGCTAGAGAGGTGGCATAGCCTCATAAAATATCTGAAATATAAAACTAAAGATCTACAAAAGGTTTGCTATGTGCCCCATTTTAAGGTCGGATGGGCATGGTGGACCTGCAGCAGAGTAATCTTCCCACTACAGGAAGGAAGCCATTTAGAAGTACAAGGGTATTGGCATTTGACACCAGAAAAAGGGTGGCTCAGTACTTATGCAGTGAGGATAACCTGGTACTCAAAGAACTTTTGGACAGATGTAACACCAAACTATGCAGACATTTTACTGCATAGCACTTATTTCCCTTGCTTTACAGCGGGAGAAGTGAGAAGGGCCATCAGGGGAGAACAACTGCTGTCTTGCTGCAGGTTCCCGAGAGCTCATAAGTACCAGGTACCAAGCCTACAGTACTTAGCACTGAAAGTAGTAAGCGATGTCAGATCCCAGGGAGAGAATCCCACCTGGAAACAGTGGAGAAGAGACAATAGGAGAGGCCTTCGAATGGCTAAACAGAACAGTAGAGGAGATAAACAGAGAGGCGGTAAACCACCTACCAAGGGAGCTAATTTTCCAGGTTTGGCAAAGGTCTTGGGAATACTGGCATGATGAACAAGGGATGTCACCAAGCTATGTAAAATACAGATACTTGTGTTTAATACAAAAGGCTTTATTTATGCATTGCAAGAAAGGCTGTAGATGTCTAGGGGAAGGACATGGGGCAGGGGGATGGAGACCAGGACCTCCTCCTCCTCCCCCTCCAGGACTAGCATAAATGGAAGAAAGACCTCCAGAAAATGAAGGACCACAAAGGGAACCATGGGATGAATGGGTAGTGGAGGTTCTGGAAGAACTGAAAGAAGAAGCTTTAAAACATTTTGATCCTCGCTTGCTAACTGCACTTGGTAATCATATCTATAATCGTCACGGAGACACTCTAGAGGGAGCAGGAGAACTCATTAGAATCCTCCAACGAGCGCTCTTCATGCATTTCAGAGGCGGATGCATCCACTCCAGAATCGGCCAACCTGGGGGAGGAAATCCTCTCTCAGCTATACCGCCCTCTAGAAGCATGCTGTAGAGCAAGAAATGGAGCCAGTAGATCCTAGACTAGAGCCCTGGAAGCATCCAGGGAGTAAGCCTAAAACTGCTTGTACCAATTGCTATTGTAAAAAGTGTTGCTTTCATTGCCAAGTTTGTTTCACAACAAAAGCCTTAGGCATCTCCTATGGCAGGAAGAAGCGGAGACAGCGACGAAGAGCTCATCAGAACAGTCAGACTCATCAAGCTTCTCTATCAAAGCAGTAAGTAGTACATGTAATGCAACCTATACAAATAGCAATAGTAGCATTAGTAGTAGCAATAATAATAGCAATAGTTGTGTGGTCCATAGTAATCATAGAATATAGGAAAATATTAAGACAAAGAAAAATAGACAGGTTAATTGATAGACTAATAGAAAGAGCAGAAGACAGTGGCAATGAGAGTGAAGGAGAAATATCAGCACTTGTGGAGATGGGGGTGGAGATGGGGCACCATGCTCCTTGGGATGTTGATGATCTGTAGTGCTACAGAAAAATTGTGGGTCACAGTCTATTATGGGGTACCTGTGTGGAGAGAAGCAACCACCACTCTATTTTGTGCATCAGATGCTAAAGCCTATGATACAGAGGTACATAATGTTTGGGCCACACATGCCTGTGTACCCACAGACCCCAACCCACAAGAAGTAGTATTGGGAAATGTGACAGAAAATTTTAACATGTGGAAAAATAACATGGTAGATCAGATGCATGAGGATATAATCAGTTTATGGGATGAAAGCCTAAAGCCATGTGTAAAATTAACCCCACTCTGTGTTACTTTAAATTGCACTAATTTGAATATCACTAAGAATACTACTAATCTCACTAGTAGCAGCTGGGGAATGATGGAGGAAGGAGAAATAAAAAATTGCTCTTTCTATATCACCACAAGCATAAGAAATAAGGTAAAGAAAGAATATGCACTTTTTAATAGACTTGATGTAGTACCAGTAAAAAATACTAGTAATACTAAGTATAGGTTAATAAGTTGTAACACCTCAGTCATTACACAGGCCTGTCCAAAGGTATCCTTTCAGCCAATTCCCATACATTATTGTGTCCCGGCTGGGTTTGCGATACTAAAGTGTAACAATAAGACATTCAATGGATCAGGACCATGCACAAATGTCAGCACAGTACAATGTACACATGGAATTAGGCCAGTGGTGTCAACTCAACTGCTGTTAAATGGCAGTCTAGCAGAAGAAGACATAGTAATTAGATCTGAAGATTTCACAGACAATGTTAAAACCATAATAGTACAGCTAAATGAATCTGTAGTAATTAATTGTACAAGACCCAACAACAATACAAGAGAAAGGTTATCTATAGGACCAGGGAGAGCATTTTATGCAAGAAGAAACATAATAGGAGATATAAGACAAGCACATTGTAACATTAGTAGAGCAAAATGGAATAACACTTTACAACAGATAGTTATAAAATTAAGAGAAAAATTTAGGAATAAAACAATAGCCTTTAATCAATCCTCAGGAGGGGACCCAGAAATTGTAATGCACAGTTTTAATTGTGGAGGGGAATTTTTCTACTGTAATACAGCACAACTGTTTAATAGTACTTGGAATGTTGCTGGAGGGACAAATGGCACTGAAGGAAATGACATAATCACACTCCAATGCAGAATAAAACAAATTATAAATATGTGGCAGAAAGTAGGAAAAGCAATGTATGCCCCTCCCATCACAGGACAAATTAGATGTTCATCAAATATTACAGGGCTGCTACTAACAAGAGATGGAGGTAATAGTACTGAGACTGAGACTGAGATCTTCAGACCTGGAGGAGGAGATATGAGGGACAATTGGAGAAGTGAATTATATAAATATAAAGTAGTAAGAATTGAACCAATAGGAGTAGCACCCACCAGGGCAAAGAGAAGAACAGTGCAAAGAGAAAAAAGAGCAGTGGGAATAGGAGCTGTGTTCCTTGGGTTCTTGGGAGCAGCAGGAAGCACTATGGGCGCAGCGTCAGTGACGCTGACGGTACAGGCCAGGCTATTATTGTCTGGTATAGTGCAGCAGCAGAACAATCTGCTGAGGGCTATTGAGGCGCAACAGAATATGTTGCGACTCACAGTCTGGGGCATCAAGCAGCTCCAGGCAAGAGTCCTGGCTCTGGAAAGATACCTAAGGGATCAACAGCTCATGGGAATTTGGGGTTGCTCTGGAAAACTCATTTGCACCACTTCTGTGCCTTGGAATGTTAGTTGGAGTAATAAATCTGTGGATGATATTTGGAATAACATGACCTGGATGGAGTGGGAAAGAGAAATTGACAATTACACAGACTATATATATGACTTACTTGAAAAATCGCAAACCCAACAAGAAAAGAATGAAAAAGAATTATTGGAATTGGATAAATGGGCAAGTTTGTGGAATTGGTTTGACATAACAAACTGGCTGTGGTATATAAGATTATTCATAATGATAGTAGGAGGCTTGATAGGTTTAAGAATAGTTTTTGCTGTACTTTCTATAGTAAATAGAGTTAGGCAGGGATATTCACCATTATCGTTTCAGACCCTCCTCCCAGCCTCGAGGGGACCCGACAGGCCCGAAGGAACAGAAGAAGAAGGTGGAGAGAGAGACAGAGACAGATCCGGTCCATCAGTGAACGGATCCTTGGCACTTATCTGGGACGATCTGCGGAGCCTGTGCCTCTTCAGCTACCACCGCTTGAGAGACTTACTCTTGATTGTAACGAGGATTGTGGAACTTCTGGGACGCAGGGGGTGGGAAGCCCTCAAATATTGGTGGAATCTCCTACAGTATTGGAGTCAGGAACTAAAGAATAGTGCTGTTAGCTTGCTACAATATGGGTGGAGCTATTTCCATGAGGCGGTCCAGGCCGTCTGGAGATCTGCGACAGAGACTCTTGCGGGCGCGTGGGGAGACTTATGGGAGACTCTTAGGAGAGGTGGAAGATGGATACTCGCAATCCCCAGGAGGATTAGACAAGGGCTTGAGCTCACTCTCTTGTGAGGGACAGAAATACAATCAGGGACAGTATATGAATACTCCATGGAGAAACCCAGCTGAAGAGAGAGAAAAATTAGCATACAGAAAACAAAATATGGATGATATAGATGAGGAAGATGATGACTTGGTAGGGGTATCAGTGAGGCCAAAAGTTCCCCTAAGAACAATGAGTTACAAATTGGCAATAGACATGTCTCATTTTATAAAAGAAAAGGGGGGACTGGAAGGGATTTATTACAGTGCAAGAAGACATAGAATCTTAGACATATACTTAGAAAAGGAAGAAGGCATCATACCAGATTGGCAGGATTATACCTCAGGACCAGGAATTAGATACCCAAAGACATTTGGCTGGCTATGGAAATTAGTCCCTGTAAATGTATCAGATGAGGCACAGGAGGATGAGGAGCATTATTTAATGCATCCAGCTCAAACTTCCCAGTGGGATGACCCTTGGGGAGAGGTTCTAGCATGGAAGTTTGATCCAACTCTGGCCTACACTTATGAGGCATATGTTAGATACCCAGAAGAGTTTGGAAGCAAGTCAGGCCTGTCAGAGGAAGAGGTTAGAAGAAGGCTAACCGCAAGAGGCCTTCTTAACATGGCTGACAAGAAGGAAACTCGCTGAAACAGCAGGGACTTTCCACAAGGGGATGTTACGGGGAGGTACTGGGGAGGAGCCGGTCGGGAACGCCCACTTTCTTGATGTATAAATATCACTGCATTTCGCTCTGTATTCAGTCGCTCTGCGGAGAGGCTGGCAGATTGAGCCCTGGGAGGTTCTCTCCAGCACTAGCAGGTAGAGCCTGGGTGTTCCCTGCTAGACTCTCACCAGCACTTGGCCGGTGCTGGGCAGAGTGACTCCACGCTTGTTTGCTTAAAGCCCTCTTCAATAAAGCTGCCATTTTAGAAGTA'),
('E660', 'Virus', 'E660', 'RNA', 'SIV', 'GGGACTTGAAGGAGAGTGAGAGCTCCTGAGTACGGMTGWGTGAAGGCAGTAAGGGCGGCAGGAACAAAMCACGACGGAGAGCTCCTAGAAAGGCGCGGGCCGGTACCAGGCGGCGTGAGGAGCGGGAGTCGGAGAGGCCTCCGGTTGCAGGTAAGTGCAACAGAAAAGTCATAGGACTGAGTTCCCTACTTTTGAGGAAAGAGTAGGAGAGTGGGAGATGGGCGCGAGAAACTCCGTCTTGTCAGGGAAGAAAGCAGATGAATTAGAAAAAATTAGGTTACGGCCCAACGGAAAGAAAAAGTATATGTTGAAGCATRTAGTATGGGCAGCAAATGAATTGGACAGATTTGGATTAGCAGAAAGCCTGTTGGATAACAAAGAAGGTTGTCAAAAAATTCTTTCRGTTTTAGCTCCATTAGTTCCGACAGGTTCAGAAAATTTAAAGAGCCTTTATAATACTGTCTGCGTCATTTGGTGCATTCACGCAGAAGAGAAAGTGAAACATACTGAGGAAGCAAAACAAATAGTGCAGAGACATCTAGTGGTGGAAACAGGAACAGCAGACAAAATGCCAGCAACAAGCAGACCAACAGCACCACCTAGTGGCAGAGGAGGAAATTACCCAGTGCAGCAARTAGGTGGCAATTATGTCCACCTACCCTTAAGTCCAAGAACATTAAATGCTTGGGTAAAATTRGTAGAAGAGAAAAAATTTGGGGCAGAGGTAGTGCCAGGATTTCAAGCGCTATCAGAAGGCTGCACTCCCTATGATATCAATCAAATGCTAAATTGTGTAGGAGAACATCAGGCAGCCATGCAAATTATTAGAGAGATTATAAATGAAGAAGCTGCCGATTGGGATTTACAACACCCGCARCCAGGTCCACTACCAGCAGGGCAACTTAGAGAGCCAAGAGGATCAGACATTGCAGGAACTACTAGTACAGTAGATGAACAAATCCAATGGATGTACAGGCAACAAAACCCYATACCAGTAGGCAACATTTATAGAAGGTGGATCCAATTAGGGCTGCAGAAATGTGTAAGAATGTATAACCCAACAAACATTTTAGATGTGAAACAAGGACCAAAAGAGCCATTTCAAAGCTACGTAGATAGATTCTAYAAAAGTCTAAGAGCAGAGCAAACAGATCCGGCAGTAAAGAATTGGATGACCCAAACACTGCTGATTCAAAATGCTAACCCAGATTGTAAATTRGTGCTCAAGGGTCTGGGTATGAATCCCACTTTAGAAGAAATGCTGACAGCCTGTCAGGGAATAGGAGGGCCAGGACAAAAAGCTAGATTAATGGCAGAAGCATTGAAAGAGGCACTGAGACCAGACCAACTCCCATTTGCAGCAGTCCAACAGAAAGGACAAAGGAGGACAATCAAGTGTTGGAATTGTGGAAAGGAGGGACACTCTGCAAGACAATGCAGGGCCCCTAGAAGACAGGGCTGCTGGRRGTGYGGAAAMACGGGTCATGTTATGGCCAAATGCCCTGAAAGACAGGCGGGTTTTTTAGGGCTTGGCCCATGGGGAAAGAAGCCCCGCAATTTCCCCATGGCCCAGATGCCTCAGGGGCTGATACCAACTGCTCCCCCAGAGGATCCAGCTGTGGATCTACTGAAGAATTACATGAAGATGGGCAGAAAGCAGAGGGAGAACAGAGAGAGACCTTACAAGGAGGTGACAGAGGATTTGCTGCACCTCAATTCTCTCTTTGGAGAAGACCAGTAGTCACTGCCTACATTGAAGAACAGCCCGTAGAAGTATTATTAGATACAGGGGCTGACGATTCAATTGTAGCAGGGATAGAATTGGGTCCAAATTATACCCCTAAAGTAGTAGGAGGAATAGGAGGCTTCATTAATACCAAAGAATATAAAGATGTAAAAATAAAAGTCTTAGGCAAGGTAATTAAGGGAACAATTATGACGGGAGATACCCCAATTAATATTTTTGGCAGAAATTTGCTAACAGCTATGGGCATGTCYTTAAATCTCCCCATAGCTAAGGTGGAGCCTATAAAAGTAACACTAAAACCAGGGAAAGAAGGACCAAAATTGAGACAGTGGCCGCTATCAAAAGAAAAGATAATTGCATTAAGAGAAATCTGTGAAAAAATGGAAAAAGATGGCCAGTTAGAGGAAGCCCCTCCAACCAATCCGTATAACACCCCCACTTTTGCTATAAAGAAGAAAGACAAAAATAAATGGAGGATGCTAATAGATTTTAGAGAATTRAATAAGGTCACTCAAGACTTTACAGAAGTACAGTTAGGAATACCACACCCTGCAGGACTAGCAAAGAGAAGGAGGATCACAGTATTGGATGTAGGTGATGCATATTTCTCCATACCTCTAGATGAAGAATTCAGGCARTACACTGCCTTTACTTTACCATCAGTAAATAATGCWGAACCAGGAAAAAGATACATCTATAAGGTATTACCTCAAGGGTGGAAGGGGTCACCAGCTATTTTTCAGTATACTATGAGAAATGTATTAGAACCTTTCAGAAAAGCAAATCCAGATGTGACCCTGATCCAATACATGGATGACATCTTAATAGCTAGTGATAGAACAGATTTAGAGCATGACAGGGTAGTTTTACAGTTAAAGGAACTTCTRAACGGCATAGGATTCTCYACCCCAGARGAGAAGTTCCAGAAAGATCCCCCATTCCAGTGGATGGGATATGAATTGTGGCCAACCAAATGGAAACTGCAGAAAATAGAGTTGCCACAAAGAGAGACCTGGACAGTAAATGACATACAAAAATTAGTAGGAGTGCTAAATTGGGCAGCACAAATTTATCCAGGAATAAAGACTAAACATCTTTGCAGACTAATCAGAGGAAAAATGACTTTAACAGAAGAGGTTCAGTGGACTGAGATGGCAGAGGCAGAATATGAAGAAAAYAAGATAATTCTCAGTCAAGAACAAGAAGGATGTTACTACCAAGAGGGAAAACCAATAGAGGCAACAGTAATAAAGAGTCAGGATAATCAATGGTCATATAAAATTCACCAAGAAGACAAAGTACTGAAAGTAGGTAAATTTGCAAAGGTTAAAAATACACATACAAATGGAGTCAGATTAYTAGCACACGTAGTGCAGAAAATAGGAAAAGAAGCACTAGTAATTTGGGGAGAGGTGCCAAAATTCCATTTGCCAGTAGAAAGAGAAATTTGGGAACAATGGTGGACAGATTATTGGCAAGTRACCTGGATACCAGATTGGGACTTTGTGTCAACACCTCCCTTAGTCAGATTAGTCTTCAACCTAGTAAAAGAGCCTATACAGGGGGCAGAAACATTYTATGTAGATGGATCCTGTAATAGGCAGTCAAGAGAAGGAAAAGCAGGCTATGTGACGGATAGGGGCAGAGACAAAGCAAAACTTTTAGAACAGACTACCAACCAACAAGCAGAGTTGGAAGCCTTTTATCTAGCCTTARCAGATTCGGGACCRAAAGCAAATATTATAGTAGATTCCCAATATGTTATGGGCATAATAGCAGGTCAACCCACTGAATCAGAAAGTAGGTTAGTAAACCAGATAATAGAGGAGATGATTAAAAARGAAGCAATTTATGTAGCATGGGTRCCTGCACATAAAGGAATAGGAGGAAATCAAGAAGTAGATCACCTGGTTAGCCAGGGAATTAGACAAGTCCTATTCTTAGAAAAAATAGAACCAGCACAAGAAGAGCATGAAAAGTACCATAGTAATGTAAAAGAATTGGTATTCAAATTTGGTTTACCTAGGCTAGTAGCAAAACAGATAGTAGACACATGTGATAAATGCCACCAGAAAGGAGAAGCCATACATGGGCAAGTAAATGCAGAACTAGGGACTTGGCAAATGGACTGTACGCACCTAGAAGGCAAAATAATTATAGTTGCAGTACATGTGGCTAGTGGATTCATAGAGGCAGAAGTAATCCCGCAGGAAACAGGAAGACAAACAGCACTGTTTCTGTTAAAGTTAGCTGGCAGATGGCCTATCACACATCTGCATACTGATAATGGTGCCAATTTCACATCACAAGAAGTGAAAATGGTTGCCTGGTGGGCAGGGATTGAACAGACCTTTGGGGTGCCTTATAATCCACAGAGCCAAGGAGTAGTGGAAGCAATGAACCATCATTTAAAAACCCAGATAGATAGAATTAGAGAACAAGCAAACTCAATAGAGACYATAGTACTAATGGCAGTTCATTGYATGAATTTTAAAAGAAGGGGAGGAATAGGGGATATGACTCCAGCAGAAAGATTAGTCAATATGATCACCACAGAACAAGAAATACAATTCCAACAATCAAAAAATTCAAAATTTAAAAATTTTCGGGTCTATTACAGAGAAGGCAGAGACCAGCTGTGGAAAGGACCCGGTGAGCTATTGTGGAAAGGGGAAGGAGCAGTCATCCTAAAGGTAGGGACAGAGATCAAGGTAGTACCAAGGAGGAAAGCTAAAATTATCAAAGACTATGGAGGAGGAAAAGAATTGGATAGTGGTTCCCACTTGGAGGATACCGGAGAGGCTAGAGAGGTGGCATAGCCTCATCAAACACCTGAAATATAACACTAAAGACCTACAGATGGCTTGTTATGTGCCCCATCATAAAGTTGGATGGGCATGGTGGACTTGCAGCAGAGTAATTTTCCCATTAAGRGATGAGACTCATTTGGAAGTACAAGGATATTGGAATTTGGCACCAGAAAAAGGATGGCTCAGTACTCATGCAGTAAGAATAACCTGGTACTCCAGAAATTTCTGGACAGATGTAACACCAGATTATGCAGACACTTTACTGCATAGCACTTATTTCCCTTGCTTTTCAGAGGGAGAAGTACGAAGGGCCATCAGGGGAGAGAAATTGCTGTCTTGCTGCAAGTTCCCGAAAGCTCATAAAAATCAGGTACCAAGCCTACAGTATCTAGCACTAACAGTAGTAAGTCATGTCAGATCCCAGGGAGAGGATCCCACCTGGAAACAGTGGGGAAGAAACAATAGAAGARGCCTTCGAATGGCTAAACAGAACAGTAGAAGGAATAAACAGGGCAGCAGTAAATCACCTGCCGAGGGAGCTAATTTTCCAGGTTTGGCGAAGGTCCTGGGAATACTGGCATGATGAWATGGGRATGTCAGAAAGCTACACAAAATATAGATACTTGTGCTTGATACAGAAAGCTCTGTTTGTGCATTGCAAGAAAGGGTGTAGGTGCTTAGGAGARGRGCATGGGGCAGGGGGATGGAGAACAGGGCCTCCTCCTCCTCCCCCTCCAGGACTAGCATAAAATGGCAGAAAGACCTCCAGAAGATGAAGCCCCACAGAGGGAACCATGGGATGAATGGGTAGTGGAAGTTCTGGAGGAATTAAAAGAAGAAGCCCTGAAACATTTTGATCCTCGCTTGCTAACTGCGCTTGGTAACTATATTTATGATAGACATGGAGACACCCTTGAAGGAGCAGGAGAACTCATTAGAATCCTGCAGAGAGCACTCTTCATCCATTTCAGAAGTGGATGTGCCCACTCCAGAATCGGCCAATCTAGAGGAGGAAATCCTCTATCAACTATACCGCCCTCTAGAGACATGCTATAACAAGTGCTACTGTAAGAGGTGTTGCTATCATTGTCAGCATTGTTTTCTTAAAAAGGGTTTGGGAATATGCTATGAGCAGCACCGAAGAAGAACTCCGAAAAAGACTAAGGCTAATCCACTTCCTGCATCAAACAAGTAAGTATGGGATGTCTTGGGAATCAGCTGCTTATCGCGCTCTTGCTAGTAAGTGCTTTAGAGATTTATTGTGTTCAATATGTAACAGTATTCTATGGTGTACCAGCATGGAAGAATGCGACAATTCCCCTCTTCTGTACAACCAGGAATAGGGACACTTGGGGAACAACACAATGCTTGCCAGATAATGATGATTACTCAGAATTGGCAATCARTATCACAGAGGCTTTTGATGCTTGGAATAATACAGTCACAGAACAAGCAATAGAGGATGTGTGGAACCTCTTTGAAACATCCATTAAGCCCTGTGTAAAACTCACCCCACTATGTATAGCAATGAGATGTAATAAAACTGAGACAGATAGGTGGGGTTTGACAAGRAACGCAGGGACAACAACAACAACAACAACAACAACAACAGCAGCAACACCAAGTGTRGCAGAAAATGTTATAAATGAAAGTAATCCTTGCATAAAAAATAATAGTTGTGCAGGCTTGGAACAGGAGCCCATGATAGGTTGTAAATTTAACATGACAGGGTTAAAAAGGGACAAAAGGATAGAATATAATGAAACATGGTATTCAAGAGATTTAATCTGTGAGCAGTCAGCGAATGAAAGTGAGAGTAAATGTTACATGCATCATTGTAACACCAGTGTTATTCAGGAATCCTGTGACAAGCATTATTGGGATGCTATTAGATTTAGATATTGTGCACCGCCAGGTTATGCTTTGCTTAGGTGTAATGATTCAAATTATTCAGGCTTTGCTCCTAACTGTTCTAAGGTAGTGGTTTCTTCATGCACAAGAATGATGGAGACGCAAACCTCTACTTGGTTTGGCTTCAATGGTACTAGGGCAGAAAATAGAACATACATTTATTGGCATGGCAAAAGTAATAGAACCATAATTAGCTTAAATAAGTATTATAATCTAACAATGAGATGTAGAAGACCAGGAAATAAGACAGTTTTACCAGTCACCATTATGTCAGGGTTGGTCTTCCATTCGCAACCCATAAATGAGAGACCAAAACAGGCCTGGTGCTGGTTTGGAGGAAGCTGGAAAGAGGCCATCCAGGAAGTGAAGGAAACCTTGGTCAAACATCCCAGGTATACGGGAACTAATGATACTAAGAAAATTAATCTAACAGCTCCAGCAGGAGGAGATCCAGAAGTCACTTTTATGTGGACAAATTGTAGAGGAGAATTCTTATACTGCAAAATGAATTGGTTTCTTAATTGGGTAGAGGACAGAGACCAAAAGRGTAGCAGATGGAGACAACAAAATACGAGAGAGCGACAGAAGAAAAATTATGTGCCATGTCATATTAGACAAATAATCAACACGTGGCACAAAGTAGGCAAAAATGTATATTTGCCTCCTAGGGAAGGAGACCTGACATGTAATTCCACTGTAACTAGTCTCATAGCAGAGATAGATTGGACCAATAACAATGAGACCAATATCACCATGAGTGCAGAGGTGGCAGAACTGTATCGATTGGAGTTGGGAGATTACAAATTAGTAGAGATTACTCCAATTGGCTTGGCCCCCACAAGTGTAAGAAGGTACACCACAACTGGTGCCTCAAGAAATAAGAGAGGGGTCTTTGTGCTAGGGTTCTTGGGTTTTCTCGCGACAGCAGGTTCTGCAATGGGCGCGGCGTCGCTGACGCTGTCGGCTCAGTCCCGGACTTTGTTGGCTGGGATAGTGCAGCAACAGCAACAGCTGTTGGATGTGGTCAAGAGACAACAAGAATTGTTGCGACTGACCGTCTGGGGAACTAAGAACCTCCAGACTAGAGTCACTGCTATCGAGAAGTACCTGAAGGATCAGGCGCAGCTAAATTCATGGGGATGTGCTTTTAGGCAAGTCTGTCACACTACTGTACCATGGCCAAATGAAACATTGGTGCCTAATTGGAGCAATATGACTTGGCAAGAGTGGGAAAGACAGGTTGACTTCCTAGAGGCAAATATAACTCAATTATTAGAAGAAGCACAAATTCAGCAAGAAAAGAATATGTATGAATTGCAAAAACTAAATAGCTGGGATATCTTTGGCAATTGGTTTGACCTTACTTCTTGGATAAGATATATACAATATGGTGTACTAATAGTTTTAGGAGTAGTAGGGTTAAGAATAGTAATATATGTAGTGCAGATGTTAGCTAGGTTAAGACAGGGTTATAGGCCAGTGTTCTCTTCCCCTCCCGCTTATGTTCAGCAGATCCCTATCCACAAGGGCCAGGAACCGCCAACCAAAGAAGGAGAAGAAGGAGAAGGTGGAGACAGAGGTGGCAACAGATCTTGGCCTTGGCAGATAGAATATATTCATTTCCTAATCCGCCAACTGATACGCCTCTTGACTTGGCTATTCAGCAGCTGCAGGGATTGGCTATTGAGGAYCTACCAGRTCCTCCAACCAGTRCTCCAGAGCCTCTCAACGACGTYGCAAAGAGTCCGTGAAGTCATCAGAATTGGAATAGCCTACCTACAATATGGGTGGCGTTATTTCCAAGAAGCAGTGCAGGCGTGGTGGAAATTTGCGCGAGAGACTCTTGCAAGCGCGTGGAGAGACATATGGGAGACTCTGGGAAGGGTTGGAAGAGGGATACTCGCAATCCCKAGGCGCRTCAGGCAAGGGYTTGAGCTCRCTCTCTTGTGAGCCTCAGAAATATAGTGAGGGACAATATATGAATACCCCCTGGAGGAACCCAGCAGCAGAAAGAGCAAAATTAGGTTATAGACAACAAAACATGGATGATGTGGATGATGAAGATGATGACTTAGTARGTGTCTCAGTGCACCCAAGAGTCCCCTTAAGGGCCATGACATACAAATTGGCAATAGACATGTCTCATTTTATAAAAGAAAAGGGGGGACTGGAAGGGATTTATTACAATGAGAAAAGACATAGAATATTAGATATGTACATGGAAAAGGAAGAAGGAATAATACCAGATTGGCAAAATTACACATCAGGGCCAGGAACTAGATACCCTATGTACTATGGGTGGCTCTGGAAATTAGTCCCAGTAGATGTCTCAGATGARGCTCAGGAAGACGAGACACATTGCCTGATGCATCCGGCACAGACTCATCAGTGGGATGACCCCTGGGGAGAGGTACTGGCATGGAAGTTTGATCCAGAATTAGCTTATAGCTATAAGGCATTTATTAAGTACCCAGAAGAGTTTGGTAGTAAGTCAGRCTTGTCAGAGGAAGAGGTAAAGAGAAGGCTAACCGCAAGAGGCCTTATTAAAATGGCTGACAAGAAGGAAACAAGCTGAGACAGCAGGGACTTTCCACAAGGGRCTKTCACATGGGGAGGTWCTGGGGAGGAACTGGGGAGGAGCTGGCTGGAACGCCCACTTATTCTCTGTATAAATATAACTGCATTTCGCTCTGTATTCAGTCGCTCTGCGGAGAGGCTGGCAGATTGAGCCCTGGGAGGTTCTCTCCAGCACTAGCAGGTAGAGCCTGGGTGTTCCCTGCTAGACTCTCACCAGCACTTGGCCGGTGCTGGGCAGAGTGGCTCCACGCTTGCTTGCTTAAAGACCTCTTCAATAAAGCTGCCATTTAGAAGTAAGCAAGTGTGTGTTCCCATCTCTCCTAGTCGCCGCCTGGTCATCTCGGTACTCGACAYATAAGAAGACCCTGGTCTGTTAGGACCCTTTCTGCTT'),
('HXB2', 'Virus', 'HXB2', 'RNA', 'HIV', 'GGTCTCTCTGGTTAGACCAGATCTGAGCCTGGGAGCTCTCTGGCTAACTAGGGAACCCACTGCTTAAGCCTCAATAAAGCTTGCCTTGAGTGCTTCAAGTAGTGTGTGCCCGTCTGTTGTGTGACTCTGGTAACTAGAGATCCCTCAGACCCTTTTAGTCAGTGTGGAAAATCTCTAGCAGTGGCGCCCGAACAGGGACCTGAAAGCGAAAGGGAAACCAGAGGAGCTCTCTCGACGCAGGACTCGGCTTGCTGAAGCGCGCACGGCAAGAGGCGAGGGGCGGCGACTGGTGAGTACGCCAAAAATTTTGACTAGCGGAGGCTAGAAGGAGAGAGATGGGTGCGAGAGCGTCAGTATTAAGCGGGGGAGAATTAGATCGATGGGAAAAAATTCGGTTAAGGCCAGGGGGAAAGAAAAAATATAAATTAAAACATATAGTATGGGCAAGCAGGGAGCTAGAACGATTCGCAGTTAATCCTGGCCTGTTAGAAACATCAGAAGGCTGTAGACAAATACTGGGACAGCTACAACCATCCCTTCAGACAGGATCAGAAGAACTTAGATCATTATATAATACAGTAGCAACCCTCTATTGTGTGCATCAAAGGATAGAGATAAAAGACACCAAGGAAGCTTTAGACAAGATAGAGGAAGAGCAAAACAAAAGTAAGAAAAAAGCACAGCAAGCAGCAGCTGACACAGGACACAGCAATCAGGTCAGCCAAAATTACCCTATAGTGCAGAACATCCAGGGGCAAATGGTACATCAGGCCATATCACCTAGAACTTTAAATGCATGGGTAAAAGTAGTAGAAGAGAAGGCTTTCAGCCCAGAAGTGATACCCATGTTTTCAGCATTATCAGAAGGAGCCACCCCACAAGATTTAAACACCATGCTAAACACAGTGGGGGGACATCAAGCAGCCATGCAAATGTTAAAAGAGACCATCAATGAGGAAGCTGCAGAATGGGATAGAGTGCATCCAGTGCATGCAGGGCCTATTGCACCAGGCCAGATGAGAGAACCAAGGGGAAGTGACATAGCAGGAACTACTAGTACCCTTCAGGAACAAATAGGATGGATGACAAATAATCCACCTATCCCAGTAGGAGAAATTTATAAAAGATGGATAATCCTGGGATTAAATAAAATAGTAAGAATGTATAGCCCTACCAGCATTCTGGACATAAGACAAGGACCAAAGGAACCCTTTAGAGACTATGTAGACCGGTTCTATAAAACTCTAAGAGCCGAGCAAGCTTCACAGGAGGTAAAAAATTGGATGACAGAAACCTTGTTGGTCCAAAATGCGAACCCAGATTGTAAGACTATTTTAAAAGCATTGGGACCAGCGGCTACACTAGAAGAAATGATGACAGCATGTCAGGGAGTAGGAGGACCCGGCCATAAGGCAAGAGTTTTGGCTGAAGCAATGAGCCAAGTAACAAATTCAGCTACCATAATGATGCAGAGAGGCAATTTTAGGAACCAAAGAAAGATTGTTAAGTGTTTCAATTGTGGCAAAGAAGGGCACACAGCCAGAAATTGCAGGGCCCCTAGGAAAAAGGGCTGTTGGAAATGTGGAAAGGAAGGACACCAAATGAAAGATTGTACTGAGAGACAGGCTAATTTTTTAGGGAAGATCTGGCCTTCCTACAAGGGAAGGCCAGGGAATTTTCTTCAGAGCAGACCAGAGCCAACAGCCCCACCAGAAGAGAGCTTCAGGTCTGGGGTAGAGACAACAACTCCCCCTCAGAAGCAGGAGCCGATAGACAAGGAACTGTATCCTTTAACTTCCCTCAGGTCACTCTTTGGCAACGACCCCTCGTCACAATAAAGATAGGGGGGCAACTAAAGGAAGCTCTATTAGATACAGGAGCAGATGATACAGTATTAGAAGAAATGAGTTTGCCAGGAAGATGGAAACCAAAAATGATAGGGGGAATTGGAGGTTTTATCAAAGTAAGACAGTATGATCAGATACTCATAGAAATCTGTGGACATAAAGCTATAGGTACAGTATTAGTAGGACCTACACCTGTCAACATAATTGGAAGAAATCTGTTGACTCAGATTGGTTGCACTTTAAATTTTCCCATTAGCCCTATTGAGACTGTACCAGTAAAATTAAAGCCAGGAATGGATGGCCCAAAAGTTAAACAATGGCCATTGACAGAAGAAAAAATAAAAGCATTAGTAGAAATTTGTACAGAGATGGAAAAGGAAGGGAAAATTTCAAAAATTGGGCCTGAAAATCCATACAATACTCCAGTATTTGCCATAAAGAAAAAAGACAGTACTAAATGGAGAAAATTAGTAGATTTCAGAGAACTTAATAAGAGAACTCAAGACTTCTGGGAAGTTCAATTAGGAATACCACATCCCGCAGGGTTAAAAAAGAAAAAATCAGTAACAGTACTGGATGTGGGTGATGCATATTTTTCAGTTCCCTTAGATGAAGACTTCAGGAAGTATACTGCATTTACCATACCTAGTATAAACAATGAGACACCAGGGATTAGATATCAGTACAATGTGCTTCCACAGGGATGGAAAGGATCACCAGCAATATTCCAAAGTAGCATGACAAAAATCTTAGAGCCTTTTAGAAAACAAAATCCAGACATAGTTATCTATCAATACATGGATGATTTGTATGTAGGATCTGACTTAGAAATAGGGCAGCATAGAACAAAAATAGAGGAGCTGAGACAACATCTGTTGAGGTGGGGACTTACCACACCAGACAAAAAACATCAGAAAGAACCTCCATTCCTTTGGATGGGTTATGAACTCCATCCTGATAAATGGACAGTACAGCCTATAGTGCTGCCAGAAAAAGACAGCTGGACTGTCAATGACATACAGAAGTTAGTGGGGAAATTGAATTGGGCAAGTCAGATTTACCCAGGGATTAAAGTAAGGCAATTATGTAAACTCCTTAGAGGAACCAAAGCACTAACAGAAGTAATACCACTAACAGAAGAAGCAGAGCTAGAACTGGCAGAAAACAGAGAGATTCTAAAAGAACCAGTACATGGAGTGTATTATGACCCATCAAAAGACTTAATAGCAGAAATACAGAAGCAGGGGCAAGGCCAATGGACATATCAAATTTATCAAGAGCCATTTAAAAATCTGAAAACAGGAAAATATGCAAGAATGAGGGGTGCCCACACTAATGATGTAAAACAATTAACAGAGGCAGTGCAAAAAATAACCACAGAAAGCATAGTAATATGGGGAAAGACTCCTAAATTTAAACTGCCCATACAAAAGGAAACATGGGAAACATGGTGGACAGAGTATTGGCAAGCCACCTGGATTCCTGAGTGGGAGTTTGTTAATACCCCTCCCTTAGTGAAATTATGGTACCAGTTAGAGAAAGAACCCATAGTAGGAGCAGAAACCTTCTATGTAGATGGGGCAGCTAACAGGGAGACTAAATTAGGAAAAGCAGGATATGTTACTAATAGAGGAAGACAAAAAGTTGTCACCCTAACTGACACAACAAATCAGAAGACTGAGTTACAAGCAATTTATCTAGCTTTGCAGGATTCGGGATTAGAAGTAAACATAGTAACAGACTCACAATATGCATTAGGAATCATTCAAGCACAACCAGATCAAAGTGAATCAGAGTTAGTCAATCAAATAATAGAGCAGTTAATAAAAAAGGAAAAGGTCTATCTGGCATGGGTACCAGCACACAAAGGAATTGGAGGAAATGAACAAGTAGATAAATTAGTCAGTGCTGGAATCAGGAAAGTACTATTTTTAGATGGAATAGATAAGGCCCAAGATGAACATGAGAAATATCACAGTAATTGGAGAGCAATGGCTAGTGATTTTAACCTGCCACCTGTAGTAGCAAAAGAAATAGTAGCCAGCTGTGATAAATGTCAGCTAAAAGGAGAAGCCATGCATGGACAAGTAGACTGTAGTCCAGGAATATGGCAACTAGATTGTACACATTTAGAAGGAAAAGTTATCCTGGTAGCAGTTCATGTAGCCAGTGGATATATAGAAGCAGAAGTTATTCCAGCAGAAACAGGGCAGGAAACAGCATATTTTCTTTTAAAATTAGCAGGAAGATGGCCAGTAAAAACAATACATACTGACAATGGCAGCAATTTCACCGGTGCTACGGTTAGGGCCGCCTGTTGGTGGGCGGGAATCAAGCAGGAATTTGGAATTCCCTACAATCCCCAAAGTCAAGGAGTAGTAGAATCTATGAATAAAGAATTAAAGAAAATTATAGGACAGGTAAGAGATCAGGCTGAACATCTTAAGACAGCAGTACAAATGGCAGTATTCATCCACAATTTTAAAAGAAAAGGGGGGATTGGGGGGTACAGTGCAGGGGAAAGAATAGTAGACATAATAGCAACAGACATACAAACTAAAGAATTACAAAAACAAATTACAAAAATTCAAAATTTTCGGGTTTATTACAGGGACAGCAGAAATCCACTTTGGAAAGGACCAGCAAAGCTCCTCTGGAAAGGTGAAGGGGCAGTAGTAATACAAGATAATAGTGACATAAAAGTAGTGCCAAGAAGAAAAGCAAAGATCATTAGGGATTATGGAAAACAGATGGCAGGTGATGATTGTGTGGCAAGTAGACAGGATGAGGATTAGAACATGGAAAAGTTTAGTAAAACACCATATGTATGTTTCAGGGAAAGCTAGGGGATGGTTTTATAGACATCACTATGAAAGCCCTCATCCAAGAATAAGTTCAGAAGTACACATCCCACTAGGGGATGCTAGATTGGTAATAACAACATATTGGGGTCTGCATACAGGAGAAAGAGACTGGCATTTGGGTCAGGGAGTCTCCATAGAATGGAGGAAAAAGAGATATAGCACACAAGTAGACCCTGAACTAGCAGACCAACTAATTCATCTGTATTACTTTGACTGTTTTTCAGACTCTGCTATAAGAAAGGCCTTATTAGGACACATAGTTAGCCCTAGGTGTGAATATCAAGCAGGACATAACAAGGTAGGATCTCTACAATACTTGGCACTAGCAGCATTAATAACACCAAAAAAGATAAAGCCACCTTTGCCTAGTGTTACGAAACTGACAGAGGATAGATGGAACAAGCCCCAGAAGACCAAGGGCCACAGAGGGAGCCACACAATGAATGGACACTAGAGCTTTTAGAGGAGCTTAAGAATGAAGCTGTTAGACATTTTCCTAGGATTTGGCTCCATGGCTTAGGGCAACATATCTATGAAACTTATGGGGATACTTGGGCAGGAGTGGAAGCCATAATAAGAATTCTGCAACAACTGCTGTTTATCCATTTTCAGAATTGGGTGTCGACATAGCAGAATAGGCGTTACTCGACAGAGGAGAGCAAGAAATGGAGCCAGTAGATCCTAGACTAGAGCCCTGGAAGCATCCAGGAAGTCAGCCTAAAACTGCTTGTACCAATTGCTATTGTAAAAAGTGTTGCTTTCATTGCCAAGTTTGTTTCATAACAAAAGCCTTAGGCATCTCCTATGGCAGGAAGAAGCGGAGACAGCGACGAAGAGCTCATCAGAACAGTCAGACTCATCAAGCTTCTCTATCAAAGCAGTAAGTAGTACATGTAATGCAACCTATACCAATAGTAGCAATAGTAGCATTAGTAGTAGCAATAATAATAGCAATAGTTGTGTGGTCCATAGTAATCATAGAATATAGGAAAATATTAAGACAAAGAAAAATAGACAGGTTAATTGATAGACTAATAGAAAGAGCAGAAGACAGTGGCAATGAGAGTGAAGGAGAAATATCAGCACTTGTGGAGATGGGGGTGGAGATGGGGCACCATGCTCCTTGGGATGTTGATGATCTGTAGTGCTACAGAAAAATTGTGGGTCACAGTCTATTATGGGGTACCTGTGTGGAAGGAAGCAACCACCACTCTATTTTGTGCATCAGATGCTAAAGCATATGATACAGAGGTACATAATGTTTGGGCCACACATGCCTGTGTACCCACAGACCCCAACCCACAAGAAGTAGTATTGGTAAATGTGACAGAAAATTTTAACATGTGGAAAAATGACATGGTAGAACAGATGCATGAGGATATAATCAGTTTATGGGATCAAAGCCTAAAGCCATGTGTAAAATTAACCCCACTCTGTGTTAGTTTAAAGTGCACTGATTTGAAGAATGATACTAATACCAATAGTAGTAGCGGGAGAATGATAATGGAGAAAGGAGAGATAAAAAACTGCTCTTTCAATATCAGCACAAGCATAAGAGGTAAGGTGCAGAAAGAATATGCATTTTTTTATAAACTTGATATAATACCAATAGATAATGATACTACCAGCTATAAGTTGACAAGTTGTAACACCTCAGTCATTACACAGGCCTGTCCAAAGGTATCCTTTGAGCCAATTCCCATACATTATTGTGCCCCGGCTGGTTTTGCGATTCTAAAATGTAATAATAAGACGTTCAATGGAACAGGACCATGTACAAATGTCAGCACAGTACAATGTACACATGGAATTAGGCCAGTAGTATCAACTCAACTGCTGTTAAATGGCAGTCTAGCAGAAGAAGAGGTAGTAATTAGATCTGTCAATTTCACGGACAATGCTAAAACCATAATAGTACAGCTGAACACATCTGTAGAAATTAATTGTACAAGACCCAACAACAATACAAGAAAAAGAATCCGTATCCAGAGAGGACCAGGGAGAGCATTTGTTACAATAGGAAAAATAGGAAATATGAGACAAGCACATTGTAACATTAGTAGAGCAAAATGGAATAACACTTTAAAACAGATAGCTAGCAAATTAAGAGAACAATTTGGAAATAATAAAACAATAATCTTTAAGCAATCCTCAGGAGGGGACCCAGAAATTGTAACGCACAGTTTTAATTGTGGAGGGGAATTTTTCTACTGTAATTCAACACAACTGTTTAATAGTACTTGGTTTAATAGTACTTGGAGTACTGAAGGGTCAAATAACACTGAAGGAAGTGACACAATCACCCTCCCATGCAGAATAAAACAAATTATAAACATGTGGCAGAAAGTAGGAAAAGCAATGTATGCCCCTCCCATCAGTGGACAAATTAGATGTTCATCAAATATTACAGGGCTGCTATTAACAAGAGATGGTGGTAATAGCAACAATGAGTCCGAGATCTTCAGACCTGGAGGAGGAGATATGAGGGACAATTGGAGAAGTGAATTATATAAATATAAAGTAGTAAAAATTGAACCATTAGGAGTAGCACCCACCAAGGCAAAGAGAAGAGTGGTGCAGAGAGAAAAAAGAGCAGTGGGAATAGGAGCTTTGTTCCTTGGGTTCTTGGGAGCAGCAGGAAGCACTATGGGCGCAGCCTCAATGACGCTGACGGTACAGGCCAGACAATTATTGTCTGGTATAGTGCAGCAGCAGAACAATTTGCTGAGGGCTATTGAGGCGCAACAGCATCTGTTGCAACTCACAGTCTGGGGCATCAAGCAGCTCCAGGCAAGAATCCTGGCTGTGGAAAGATACCTAAAGGATCAACAGCTCCTGGGGATTTGGGGTTGCTCTGGAAAACTCATTTGCACCACTGCTGTGCCTTGGAATGCTAGTTGGAGTAATAAATCTCTGGAACAGATTTGGAATCACACGACCTGGATGGAGTGGGACAGAGAAATTAACAATTACACAAGCTTAATACACTCCTTAATTGAAGAATCGCAAAACCAGCAAGAAAAGAATGAACAAGAATTATTGGAATTAGATAAATGGGCAAGTTTGTGGAATTGGTTTAACATAACAAATTGGCTGTGGTATATAAAATTATTCATAATGATAGTAGGAGGCTTGGTAGGTTTAAGAATAGTTTTTGCTGTACTTTCTATAGTGAATAGAGTTAGGCAGGGATATTCACCATTATCGTTTCAGACCCACCTCCCAACCCCGAGGGGACCCGACAGGCCCGAAGGAATAGAAGAAGAAGGTGGAGAGAGAGACAGAGACAGATCCATTCGATTAGTGAACGGATCCTTGGCACTTATCTGGGACGATCTGCGGAGCCTGTGCCTCTTCAGCTACCACCGCTTGAGAGACTTACTCTTGATTGTAACGAGGATTGTGGAACTTCTGGGACGCAGGGGGTGGGAAGCCCTCAAATATTGGTGGAATCTCCTACAGTATTGGAGTCAGGAACTAAAGAATAGTGCTGTTAGCTTGCTCAATGCCACAGCCATAGCAGTAGCTGAGGGGACAGATAGGGTTATAGAAGTAGTACAAGGAGCTTGTAGAGCTATTCGCCACATACCTAGAAGAATAAGACAGGGCTTGGAAAGGATTTTGCTATAAGATGGGTGGCAAGTGGTCAAAAAGTAGTGTGATTGGATGGCCTACTGTAAGGGAAAGAATGAGACGAGCTGAGCCAGCAGCAGATAGGGTGGGAGCAGCATCTCGAGACCTGGAAAAACATGGAGCAATCACAAGTAGCAATACAGCAGCTACCAATGCTGCTTGTGCCTGGCTAGAAGCACAAGAGGAGGAGGAGGTGGGTTTTCCAGTCACACCTCAGGTACCTTTAAGACCAATGACTTACAAGGCAGCTGTAGATCTTAGCCACTTTTTAAAAGAAAAGGGGGGACTGGAAGGGCTAATTCACTCCCAAAGAAGACAAGATATCCTTGATCTGTGGATCTACCACACACAAGGCTACTTCCCTGATTAGCAGAACTACACACCAGGGCCAGGGGTCAGATATCCACTGACCTTTGGATGGTGCTACAAGCTAGTACCAGTTGAGCCAGATAAGATAGAAGAGGCCAATAAAGGAGAGAACACCAGCTTGTTACACCCTGTGAGCCTGCATGGGATGGATGACCCGGAGAGAGAAGTGTTAGAGTGGAGGTTTGACAGCCGCCTAGCATTTCATCACGTGGCCCGAGAGCTGCATCCGGAGTACTTCAAGAACTGCTGACATCGAGCTTGCTACAAGGGACTTTCCGCTGGGGACTTTCCAGGGAGGCGTGGCCTGGGCGGGACTGGGGAGTGGCGAGCCCTCAGATCCTGCATATAAGCAGCTGCTTTTTGCCTGTACTGGGTCTCTCTGGTTAGACCAGATCTGAGCCTGGGAGCTCTCTGGCTAACTAGGGAACCCACTGCTTAAGCCTCAATAAAGCTTGCCTTGAGTGCTTC'),
('SIVmac251_CMstock', 'Virus', 'SIVmac251_CMstock', 'RNA', 'SIV', 'XXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXATAGAGTGGGAGATGGGCGCGAGAAACTCCGTCTTGTCAGGGAAGAAAGCAGATGAATTAGAAAAAATTAGGCTACGACCCGGCGGAAAGAAAAAGTACATGTTGAAGCATGTAGTATGGGCAGCAAATGAATTAGATAGATTTGGATTAGCAGAAAGCCTGTTGGAGAACAAAGAAGGATGTCAAAAAATACTTTCGGTCTTAGCTCCATTAGTGCCAACAGGCTCAGAAAATTTAAAGAGTCTTTATAATACTGTCTGCGTCATCTGGTGCATTCACGCAGAAGAGAAAGTGAAACACACTGAGGAAGCAAAACAGATAGTGCAGAGACACCTAGTGGTGGAAACAGGAACAGCAGAAACTATGCCAAAAACAAGTAGACCAACAGCACCATCTAGCGGCAGAGGAGGAAATTACCCAGTACAACAAATAGGTGGTAACTATGTCCACCTGCCATTAAGCCCGAGAACATTAAATGCCTGGGTAAAATTGATAGAGGAAAAGAAATTTGGAGCAGAAGTAGTGCCAGGATTTCAGGCACTGTCAGAAGGCTGCACCCCCTATGACATTAATCAGATGTTAAATTGTGTGGGAGACCATCAAGCGGCTATGCAGATTATCAGAGATATTATAAACGAGGAGGCTGCAGATTGGGACTTGCAGCACCCACAACCAGCTCCACAACAAGGACAGCTTAGGGAGCCGTCAGGATCAGATATTGCAGGAACAACTAGCTCAGTAGATGAACAAATCCAGTGGATGTACAGACAACAGAACCCCATACCAGTAGGCAACATTTACAGGAGATGGATCCAACTGGGGTTGCAAAAATGTGTCAGAATGTATAATCCAACAAACATTCTAGATGTAAAACAAGGGCCAAAAGAGCCATTTCAGAGCTATGTAGACAGATTCTACAAAAGCTTAAGAGCAGAACAAACAGATGCAGCAGTAAAGAATTGGATGACTCAAACACTGCTGATTCAAAATGCTAACCCAGATTGCAAGCTAGTGCTGAAGGGGCTGGGTGTGAATCCCACCCTAGAAGAAATGCTGACGGCTTGTCAAGGAGTAGGGGGACCAGGACAGAAGGCTAGATTAATGGCAGAAGCCCTGAAAGAGGCCCTCGCACCAGTGCCAATCCCTTTTGCAGCAGCCCAACAGAGAGGACCAAAAAAGCCAATTAAATGTTGGAATTGTGGGAAAGAAGGACACTCTGCAAGGCAATGCAGAGCCCCAAGAAGACAGGGATGCTGGAAATGTGGAAAAATGGACCATGTTATGGCCAAATGCCCAGACAGACAGGCGGGTTTTTTAGGCCTTGGTCCATGGGGAAAGAAGCCCCGCAATTTCCCCATGGCTCAAGTGCATCAGGGGCTGACGCCAACTGCTCCCCCAGAGGACCCAGCTGTGGATCTGCTAAAGAACTACATGCAGTTGGGCAAGCAGCAGAGAGAAAAGCAGAGAGAAAGCAGAGAGAAGCCTTACAAGGAGGTGACAGAGGATTTGCTGCACCTCAATTCTCTCTTTGGAGGAGACCAGTAGTCACTGCTCATATTGAAGGACAGCCTGTAGAAGTATTACTGGATACAGGGGCTGATGATTCTATTGTAACAGGAATAGAGTTAGGTCCACATTATACCCCAAAAATAGTAGGAGGAATAGGAGGTTTTATTAATACTAAAGAATACAAAAATGTAGAAATAGAAGTTTTAGGCAAAAGGATTAAGGGGACAATCATGACAGGGGACACCCCGATTAACATTTTTGGTAGAAATTTGCTAACAGCTCTGGGGATGTCTCTAAATCTTCCCATAGCTAAGGTAGAGCCTGTAAAAGTCGCCTTAAAGCCAGGAAAGGTTGGACCAAAATTGAAGCAGTGGCCATTATCAAAAGAAAAGATAGTTGCATTAAGAGAAATCTGTGAAAAGATGGAAAAGGATGGTCAGTTGGAGGAAGCTCCCCCGACCAATCCATACAACACCCCCACATTTGCTATAAAGAAAAARGATAAGAACAAATGGAGAATGCTGATAGATTTTAGGGAACTAAATAGGGTCACTCAGGACTTTACAGAAGTCCAATTAGGAATACCACACCCTGCAGGACTAGCAAAAAGGAAAAGGATTACAGTACTGGAYATAGGTGACGCATATTTCTCCATACCTCTAGATGAAGAATTTAGGCAGTACACTGCCTTTACTTTACCATCAGTAAATAATGCAGAGCCAGGAAAACGATACATTTATAAGGTTCTGCCTCAGGGATGGAAGGGGTCACCAGCCATCTTCCAATACACTATGAGACATGTGCTAGAACCCTTCAGGAAGGCAAATCCAGATGTGACCTTAGTCCAGTATATGGATGACATCTTAATAGCTAGTGACAGGACAGACCTGGAACATGACAGGGTAGTTTTACAGTTAAAGGAACTCTTAAATAGCATAGGGTTTTCTACCCCAGAAGAGAAATTCCAAAAAGATCCCCCATTTCAATGGATGGGGTACGAATTGTGGCCGACAAAATGGAAGTTGCAAAAGATAGAGTTGCCACAAAGAGAGACCTGGACAGTGAATGATATACAGAAGTTAGTAGGAGTATTAAATTGGGCAGCTCAAATTTATCCAGGTATAAAAACCAAACATCTCTGTAGGTTAATTAGAGGAAAAATGACTTTAACAGAGGAAGTTCAGTGGACTGAGATGGCAGAAGCAGAATATGAGGAAAATAAGATAATTCTCAGTCAGGAACAAGAAGGATGTTATTACCAAGAAGGCAAGCCATTAGAAGCCACGGTAATAAAGAGTCAGGACAATCAGTGGTCTTATAAAATGCACCAAGAAGACAAAATACTGAAAGTAGGAAAATTTGCAAAGATAAAGAATACACATACCAATGGAGTTAGACTATTAGCACATGTAATACAGAAAATAGGAAAGGAAGCAATAGTGATCTGGGGACAGGTCCCAAAATTCCACTTACCAGTTGAGAGGGATGTATGGGAACAGTGGTGGACAGACTATTGGCAGGTAACCTGGATACCGGAATGGGATTTTATCTCAACACCACCACTAGTAAGATTAGTCTTCAATCTAGTGAAGGACCCTATAGAGGGAGAAGAAACCTATTATACAGATGGATCATGTAATAAACAGTCAAAAGAGGGGAAAGCAGGATATATCACAGATAGGGGCAAAGACAAAGTAAAAGTGTTAGAACAGACTACTAATCAACAAGCAGAATTGGAAGCATTTCTCATGGCATTGACAGACTCAGGGCCAAAGGCAAATATTATAGTAGATTCACAATATGTTATGGGAATAATAACAGGATGCCCTACAGAATCAGAGAGCAGGCTAGTTAACCAAATAATAGAAGAAATGATTAAAAAGTCAGAAATTTATGTAGCATGGGTACCAGCACACAAAGGTATAGGAGGAAACCAAGAAATAGACCACCTAGTTAGTCAGGGGATTAGACAAGTTCTCTTCTTGGAAAAGATAGAGCCAGCACAAGAAGAACATGATAAATACCATAGTAATGTAAAAGAATTGGTATTCAAATTTGGATTACCCAGAATAGTGGCCAGACAGATAGTAGACACATGTGATAAATGTCATCAGAAAGGAGAAGCTATACATGGGCAGGTAAATTCGGATCTAGGGACTTGGCAAATGGATTGTACCCATCTAGAGGGAAAAATAGTCATAGTTGCAGTACATGTAGCTAGTGGATTCATAGAAGCAGAAGTAATTCCACAAGAAACAGGAAGACAGACAGCACTATTTCTGTTAAAATTGGCAAGCAGATGGCCTGTTACACATCTACACACAGATAATGGTGCTAACTTTGCTTCGCAAGAAGTAAAGATGGTTGCATGGTGGGCAGGGATAGAGCACACCTTTGGGGTACCATACAATCCACAGAGTCAGGGAGTAGTGGAAGCAATGAATCACCATCTGAAAAATCAAATAGATAGAATCAGGGAACAAGCAAATTCAGTAGAAACCATAGTATTAATGGCAGTTCATTGCATGAATTTTAAAAGAAGGGGAGGAATAGGGGATATGACTCCAGCAGAAAGATTAATTAACATGATCACTACAGAACAAGAAATACAATTTCAACAATCAAAAAACTCAAAATTTAAAAATTTTCGGGTCTATTACAGAGAAGGCAGAGATCAACTGTGGAAGGGACCCGGTGAGCTATTGTGGAAAGGGGAAGGAGCAGTCATCTTAAAGGTAGGGACAGACATTAAGGTAGTACCCAGAAGAAAGGCTAAAATTATCAAAGATTATGGAGGAGGAAAAGAGGTGGATAGCAGTTCCCACATGGAGGATACCGGAGAGGCTAGAGAGGTGGCATAGCCTCATAAAATATCTGAAGTATAAAACTAAAGATCTACAAAAGGTTTGCTATGTGCCCCATTATAAGGTCGGATGGGCATGGTGGACCTGCAGCAGAGTAATCTTCCCACTACAGGAAGGAAGCCATTTAGAAGTACAAGGGTATTGGCATTTGACACCAGAAAGAGGGTGGCTCAGTACTTATGCAGTGAGGATAACCTGGTACTCAAGGAACTTTTGGACAGATGTAACACCAGACTATGCAGACATTTTACTGCATAGCACTTATTTCCCTTGCTTTACAGCGGGAGAAGTGAGAAGGGCCATCAGGGGAGAACAACTGCTGTCTTGCTGCAGGTTCCCGAGAGCTCATAAGAACCAGGTACCAAGTCTACAGTACTTAGCACTGAGAGTAGTAAGTGATGTCAGATCCCAGGGAGAGAATCCCACCTGGAAACAGTGGAGAAGAGACAATAGGAGAGGCCTTCGAATGGCTAAACAGAACAGTAGAGGAGATAAACAGAGAGGCGGTAAACCACCTACCAAGGGAGCTAATTTTCCAGGTTTGGCAAAGGTCTTGGGAATACTGGCATGATGAACAAGGGATGTCACCAAGCTATGTAAAATACAGATACTTGTGTTTAATACAAAAGGCTTTATTTATGCATTGCAAGAAAGGCTGTAGATGTCTAGGGGAAGGACAYGGGGCAGGGGGATGGAGACCAGGACCTCCTCCTCCTCCCCCTCCAGGACTAGCATAAATGGAAGAGAGACCTCCAGAAAATGAAGGCCCACAAAGGGAACCATGGGATGAATGGGTAGTGGAGGTTCTGGAAGAACTGAAAGAAGAAGCTTTAAAACATTTTGATCCTCGCTTGCTAACTGCACTTGGTAATCATATCTATAATAGACATGGAGACACCCTTGAGGGAGCAGGAGAACTCATTAGAATCCTCCAACGAGCGCTCTTCATGCATTTCAGAGGCGGATGCAACCACTCCAGAATCGGCCAACCTGGGGGAGGAAATCCTCTCTCAACTATACCGCCCTCTTGAGGCGTGCTATAACACATGCTATTGTAAAAAGTGTTGCTACCATTGCCAGTTTTGTTTTCTTAAAAAGGGCTTGGGGATATGTTATGAGCAGTCACGAAAGAGAAGAAGAACTCCGAAAAAGGCTAAGGCTAATACATCTTCTGCATCAAACAAGTAAGTATGGGATGTCTTGGGAATCAGCTGCTTATCGCCATCTTGCTTTTAAGTGTCTATGGGATCTATTGTACTCAATATGTCACAGTCTTTTATGGTGTACCAGCTTGGAGGAATGCGACAATTCCCCTCTTCTGTGCAACCAAGAATAGGGATACTTGGGGAACAACTCAGTGCCTACCAGATAATRRTGATTATTCAGAATTGGCCMTTAATGTTACAGAAAGCTTTGATGCTTGGGAGAATACAGTCACAGAACAGGCAATAGAGGATGTATGGCAACTCTTTGAGACCTCAATAAAGCCTTGTGTAAAATTATCCCCATTATGCATTACTATGAGATGCAATAAAAGTGAGACAGATAAATGGGGATTAACAAAATCATCAACAACAACAACAGCATCAACAACAAGGACAACATCAGCAAAAATAGACATGGTCAATGAGACTAGTTCTTGTATAACTCATAATAATTGCACAGGCTTGGAACAAGAGCAAATGATAAGCTGTAAGTTCAACATGACAGGGTTAAAAAGAGACAAGAAAAAGGAGTACAATGAAACTTGGTACTCTACAGATTTGGTTTGTGAACAAGGGAATAGCACTGATAATGAAAGTAGATGCTACATGAATCACTGTAACACTTCTGTTATCCAAGAGTCTTGTGACAAGCATTATTGGGATACTATTAGATTTAGGTATTGTGCACCTCCAGGTTATGCTTTGCTTAGATGTAATGACACAAATTATTCAGGCTTTATGCCTAAATGTTCTAAGGTGGTGGTCTCTTCATGCACAAGGATGATGGAGACACAGACTTCTACTTGGTTTGGCTTTAATGGAACTAGAGCAGAAAATAGAACTTATATTTACTGGCATGGTAGAGATAATAGGACTATAATTAGTTTAAATAAGTATTATAATCTAACAATGAAATGTAGAAGACCAGGAAATAAGACAGTTTTACCAGTCACCATTATGTCTGGATTGGTTTTCCACTCACAACCAATCAATGATAGGCCAAAGCAGGCATGGTGTTGGTTTGGAGGAAATTGGAAGGATGCAATAAAAGAGGTGAAGCAGACCATTGTCAAACATCCCAGGTATACTGGAACTAACAATACTGATAAGATCAATTTGACGGCTCCTAGAGGAGGAGATCCGGAAGTTACCTTCATGTGGACAAATTGCAGAGGAGAGTTTCTCTACTGTAAAATGAATTGGTTTCTAAATTGGGTAGAAGATAGGAATCTAACTCTAACTACCCAGAAGCTAAGGGAACGGCATAAAAGGAATTACGTGCCATGTCATATTAGACAAATAATCAACACTTGGCATAAAGTAGGCAAAAATGTTTATTTGCCTCCAAGAGAGGGAGACCTCACGTGTAACTCCACAGTGACCAGTCTCATAGCAAACATAGATTGGACTGATGGAAATCAAACTAATATCACCATGAGTGCAGAGGTGGCAGAACTGTATCGATTGGAATTGGGAGATTATAAATTAGTAGAGATCACTCCAATTGGCTTGGCCCCCACAGATGTGAAGAGGTACACTACTGGTGGCACCTCAAGAAATAAAAGAGGGGTCTTTGTGCTAGGGTTCTTGGGTTTTCTCGCAACGGCAGGTTCTGCAATGGGCGCGGCGTCGTTGACGCTGACCGCTCAGTCCCGGACTTTATTGGCTGGGATAGTGCAGCAACAGCAACAGCTGTTGGACGTGGTCAAGAGACAACAAGAATTGTTGCGACTGACCGTCTGGGGAACAAAGAACCTCCAGACTAGGGTCACTGCCATCGAGAAGTACTTAAAGGACCAGGCGCAGCTGAATGCTTGGGGATGTGCGTTTAGACAAGTCTGCCACACTACTGTACCATGGCCAAATGCAAGTCTAACACCAGACTGGAACAATGATACTTGGCAAGAGTGGGAGCGAAAGGTTGACTTCTTGGAGGAAAATATAACGGCCCTTCTAGAAGAGGCACAAATTCAACAAGAGAAGAACATGTATGAATTACAAAAGTTGAATAGCTGGGATGTGTTTGGCAATTGGTTTGACCTTGCTTCTTGGATAAGGTATATACAATATGGAATTTATATAGTTGTAGGAGTAATACTGTTAAGAATAGTGATCTATATAGTACAAATGCTAGCTAAGTTAAGGCAGGGGTATAGGCCAGTGTTCTCTTCCCCACCCTCTTATTCCCAGCAGATCCATACCCAACAGGACCCGGCACTGCCAACCAGAGAAGGCAAAGAAGGAGACGGTGGAGAAGGCGGTGGCAACAGCTCCTGGCCTTGGCAGATAGAATATATTCATTTCCTGATCCGCCAACTGATACGCCTCTTGACTTGGCTATTCAGCAACTGCAGAACCTTGCTATCGAGAGTATACCAGATCCTCCAACCAATACTCCAGGGGCTCTCTGCGACCCTACGGAGAATTCGAGAAGTCCTCAGGACTGAACTGACCTACCTACAATATGGGTGGAGCTATTTCCATGAGGCGGTCCAAGCCGGCTGGAGATCTGCGACAGAGACTCTTGCGGGCGCGTGGGGAGACTTATGGGAGACTCTTAGGAGAGGTGGAAGATGGATCCTCGCAATCCCTAGGAGGATTAGACAAGGGCTTGAGCTCACTCTCTTGTGAGGGACAGAAATACAATCAGGGACAGTACATGAATACTCCATGGAGAAACCCAGCTGAAGAGAGAGAAAAATTAGCATACAGAAAACAAAATATGGATGATGTAGATGAGGAAGATGATGACTTGGTAGGGGTACCAGTGATGCCACGAGTTCCCCTAAGAACAATGAGTTACAAATTGGCAATAGATATGTCTCATTTTATAAAAGAAAAGGGGGGACTGGAAGGGATTTATTACAGTGCAAGAAGACATAGAATCTTAGACATGTACTTAGAAAAGGAGGAAGGCATCATACCAGATTGGCAGGATTACACCTCAGGACCAGGAATTAGATACCCAAAGACATTTGGCTGGCTATGGAAATTAGTCCCTGTAAATGTATCAGATGAGGCACAGGAGGATGAGGAGCATTATTTAATGCATCCAGCTCAAACTGCCCAGTGGGATGACCCTTGGGGAGAGGTTCTAGCATGGAAGTTTGATCCAACTCTAGCCTACACTTATGAGGCATATGTTAGATACCCAGAAGAGTTTGGAAGCAAGTCAGGCCTGTCAGAGGAAGAGGTTAGAAGAAGGCTAACCGCAAGAGGCCTTCTTAACATGGCTGACAAGAAGGAAACTCGCTGAGACAGCAGGGACTTTCCACAAGGGGATGTTACGGGGAGGTACTGGGGAGGAGCCGGTCGGGAACGCCCACTTTCTTGATGTATAAATATCACTGCATTTCGCTCTGTATXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXX'),
('A_Kawasaki_173_2001_PA', 'Virus', 'A_Kawasaki_173_2001', 'RNA', 'Influenza A', 'AGCGAAAGCAGGTACTGATTCGAAATGGAAGATTTTGTGCGACAATGCTTCAATCCGATGATTGTCGAGCTTGCGGAAAAGGCAATGAAAGAGTATGGAGAGGACCTGAAAATCGAAACAAACAAATTTGCAGCAATATGCACTCACTTGGAAGTATGCTTCATGTATTCAGATTTTCATTTCATCAATGAGCAAGGCGAATCAATAATAGTAGAGCCTGAGGACCCAAATGCACTTTTAAAACACAGATTTGAGATAATAGAGGGACGAGATCGTACAATGGCATGGACAGTTGTAAACAGTATTTGCAACACCACAGGAGCTGAGAAACCAAAGTTTCTGCCAGATCTGTATGATTACAAAGAGAATAGATTCATCGAGATTGGAGTGACAAGGAGGGAAGTTCACATATACTATCTGGAAAAGGCCAACAAAATTAAATCTGAAAAGACACACATTCACATTTTCTCATTCACTGGCGAAGAAATGGCCACAAAGGCCGATTACACTCTCGATGAAGAAAGCAGGGCTAGGATTAAAACCAGACTATTCACCATAAGACAAGAAATGGCAAGCAGGGGTCTTTGGGACTCCTTTCGTCAGTCCGAAAGAGGCGAAGAAACAATTGAAGAAAGATTTGAAATCACAGGGACAATGCGCAGGCTTGCTGACCAAAGCCTTCCGCCGAACTTCTCCTGCATTGAGAATTTTAGAGCCTATGTGGATGGATTTGAACCGAACGGCTACATTGAGGGCAAGCTTTCTCAAATGTCCAAAGAAGTAAATGCTAGAATTGAGCCTTTTTTGAAAACAACACCACGACCAATTAGACTTCCGGATGGGCCTCCTTGTTTTCAGCGGTCAAAATTCCTGCTGATGGATTCTTTAAAATTAAGCATTGAGGATCCAAATCATGAAGGAGAGGGAATACCACTATATGATGCAATCAAGTGTATGAGAACATTCTTTGGATGGAAAGAACCCTCTGTTGTCAAGCCACACGAGAAGGGAATAAATCCGAATTATCTGCTGTCATGGAAGCAGGTATTGGAAGAGCTGCAGGACATTGAGAGTGAGGAGAAGATTCCAAGAACAAAGAACATGAAAAAAACGAGTCAGCTAAAGTGGGCACTTGGTGAGAACATGGCACCAGAGAAGGTTGATTTTGATGACTGTAAAGATATAAGCGATTTGAAGCAATATGATAGTGACGAACCTGAATTAAGGTCATTTTCAAGTTGGATCCAGAATGAATTCAACAAGGCATGCGAGCTGACCGATTCAATCTGGATAGAGCTCGATGAGATTGGAGAAGATGTGGCCCCGATTGAACACATTGCAAGCATGAGAAGAAATTACTTCACAGCTGAGGTGTCCCATTGCAGAGCCACAGAATATATAATGAAGGGGGTATACATTAATACTGCTTTGCTTAATGCATCCTGTGCAGCAATGGATGATTTCCAACTAATTCCCATGATAAGCAAATGTAGAACTAAAGAGGGAAGGAGAAAGACCAATTTGTACGGCTTTATCATAAAAGGAAGATCTCACTTAAGGAATGACACCGATGTGGTAAACTTTGTGAGCATGGAATTTTCCCTCACTGACCCAAGACTTGAGCCACACAAATGGGAGAAGTACTGTGTTCTCGAGATAGGAGATATGCTTCTAAGGAGTGCAATAGGCCAAGTGTCAAGGCCCATGTTCTTGTATGTAAGGACAAATGGAACCTCAAAAATTAAAATGAAATGGGGAATGGAGATGAGGCGTTGCCTCCTCCAATCCCTTCAACAAATAGAGAGCATGATTGAAGCTGAATCCTCTGTCAAGGAGAAAGACATGACAAAAGAGTTTTTTGAGAATAGATCAGAAACATGGCCCATTGGAGAGTCACCAAAGGGAGTGGAAGAAGGTTCCATTGGGAAAGTATGCAGGACACTATTGGCTAAGTCAGTATTCAATAGTCTGTATGCATCGCCACAATTAGAAGGATTTTCAGCTGAGTCAAGAAAGTTGCTCCTCATTGTTCAGGCTCTTAGGGACAATCTGGAGCCTGGGACCTTTGATATTGGGGGGCTATATGAAGCAATTGAGGAGTGCCTGATTAATGATCCCTGGGTTTTGCTTAATGCTTCTTGGTTCAACTCCTTCCTAACACATGCATTGAGATAGTTGGGGCAATGCTACTATTTACTATCCATACTGTCCAAAAAAGTACCTTGTTTCTACTAATAGGAGACGTGTGTG'),
('A_Kawasaki_173_2001_PB1', 'Virus', 'A_Kawasaki_173_2001', 'RNA', 'Influenza A', 'AGCAGGCAAACCATTTGAATGGATGTCAATCCGACCTTACTTTTCTTAAAAGTGCCAGCACAAAATGCTATAAGCACAACTTTTCCTTATACTGGTGATCCTCCTTACAGCCATGGGACAGGAACAGGGTACACCATGGATACAGTCAACAGGACACATCAGTACTCAGAAAGAGGAAGATGGACAAAAAATACCGAAACTGGAGCACCGCAACTCAACCCAATTGATGGACCACTACCAAAAGACAATGAACCAAGTGGCTATGCCCAAACAGATTGTGTATTAGAAGCAATGGCTTTCCTTGAGGAATCCCATCCTGGTATTTTTGAAAACTCTTGTATTGAAACAATGGAGGTTGTTCAGCAAACAAGGGTGGACAAACTGACACAAGGCAGACAGACCTATGACTGGACTCTAAATAGAAACCAGCCTGCTGCCACAGCATTGGCCAACACTATAGAAGTGTTCAGATCAAACGGCCTCATAGCAAATGAATCTGGGAGGCTAATAGACTTCCTTAAAGATGTAATGAAGTCGATGGACAGAGACGAAGTAGAGATCACAACACATTTTCAGAGAAAGAGGAGGGTGAGAGACAATGTAACTAAAAAAATGGTGACCCAAAGAACAATAGGCAAAAAGAAACATAAATTAGACAAAAGAAGTTACCTAATTAGGGCATTAACCCTGAACACAATGACCAAAGATGCTGAGAGGGGGAAACTAAAACGTAGAGCAATTGCAACCCCAGGAATGCAAATAAGGGGGTTTGTATACTTTGTTGAGACACTGGCAAGAAGCATATGTGAAAAGCTTGAACAATCAGGGTTGCCAGTTGGGGGAAATGAAAAGAAAGCAAAGTTAGCAAATGTTGTAAGGAAGATGATGACCAACTCCCAGGACACTGAAATTTCTTTCACCATCACTGGAGATAACACAAAATGGAACGAAAATCAAAACCCTAGAATGTTTTTGGCCATGATCACATATATAACCAAAAATCAGCCTGAATGGTTCAGAAATATTCTAAGTATTGCTCCAATAATGTTTTCAAACAAAATGGCGAGACTAGGTAAGGGGTACATGTTTGAAAGCAAGAGTATGAAACTGAGAACTCAAATACCTGCAGAGATGCTAGCCAACATAGATTTGAAATATTTCAATGATTCAACTAAAAAGAAAATTGAAAAAATCCGGCCATTATTAATAGATGGAACTGCATCATTGAGTCCTGGAATGATGATGGGCATGTTCAATATGTTAAGCACCGTCTTGGGCGTCTCCATTCTGAATCTTGGGCAAAAGAGATACACCAAGACTACTTACTGGTGGGATGGTCTTCAATCGTCTGATGATTTTGCTCTGATTGTGAATGCACCCAACCATGCAGGAATCCAAGCTGGAGTTGACAGGTTTTATCGAACCTGTAAGCTGCTCGGAATTAATATGAGCAAAAAGAAGTCTTACATAAACAGAACAGGTACCTTTGAATTCACGAGCTTTTTCTATCGTTATGGGTTTGTTGCCAATTTCAGCATGGAGCTTCCTAGTTTTGGGGTGTCTGGGGTCAATGAGTCTGCAGACATGAGTATTGGAGTCACTGTCATCAAAAACAATATGATAAACAATGACCTTGGCCCAGCAACTGCTCAAATGGCCCTTCAGTTATTTATCAAAGATTACAGGTACACGTATCGATGCCACAGAGGTGACACACAAATACAAACCCGGAGATCATTTGAGATAAAGAAACTATGGGACCAAACCCGCTCCAAAGCTGGGCTGTTGGTCTCTGATGGAGGCCCCAATTTATATAACATTAGAAATCTCCATATTCCTGAAGTCTGCTTGAAATGGGAGTTGATGGATGAGGATTACCAGGGGCGTTTATGCAACCCATTGAACCCATTTGTCAGTCATAAAGAGATTGAGTCAGTGAACAATGCAGTGATGATGCCGGCACATGGTCCAGCCAAAAATATGGAGTATGACGCTGTTGCAACAACACACTCCTGGGTTCCCAAAAGGAATCGATCCATTTTGAATACGAGCCAAAGGGGGATACTTGAGGATGAGCAAATGTATCAGAGGTGTTGCAATTTATTTGAAAAATTCTTCCCAAGTAGCTCATACAGAAGACCAGTTGGAATATCCAGTATGGTAGAGGCTATGGTTTCCAGAGCCCGAATTGATGCAAGAATTGATTTCGAATCTGGAAGGATAAAGAAAGAGGAATTCGCTGAGATCATGAAGACCTGTTCCACCATTGAAGACCTCAGACGGCAAAAATAGGGAATTTGGCTTGTCCTTCATGAAAAAATGCCTTGTTTCTACTAATAGGAGACCTGTGTG'),
('A_Kawasaki_173_2001_PB2', 'Virus', 'A_Kawasaki_173_2001', 'RNA', 'Influenza A', 'AGCGAAAGCAGGTCAATTATATTCAATATGGAAAGAATAAAAGAGCTAAGGAATCTGATGTCACAATCTCGCACTCGCGAGATACTTACAAAAACTACTGTAGACCACATGGCCATAATCAAAAAATACACATCCGGAAGACAGGAGAAAAACCCATCACTTAGGATGAAATGGATGATGGCAATGAAATACCCAATTACAGCAGACAAAAGGATAACGGAAATGATTCCTGAAAGAAATGAGCAAGGACAGACATTATGGAGTAAAGTGAATGATGCCGGGTCAGACCGAGTGATGATATCACCCCTGGCTGTGACATGGTGGAATAGAAATGGACCAGTGGCAAGTACTATTCACTATCCAAAAATCTACAAAACTTACTTTGAAAAGGTTGAAAGGTTAAAACATGGAACCTTTGGCCCTGTACACTTTAGAAACCAAGTCAAAATACGCCGAAGAGTCGACATAAATCCTGGTCATGCAGACCTCAGCGCCAAGGAGGCACAGGATGTAATTATGGAAGTTGTTTTCCCTAATGAAGTGGGAGCCAGAATACTAACATCAGAATCGCAATTAACGATAACCAAAGAGAAAAAAGAAGAACTCCAAAATTGCAAAATTTCCCCTTTGATGGTTGCATACATGTTAGAGAGGGAACTTGTCCGCAAAACGAGATTTCTCCCGGTTGCTGGTGGAACAAGCAGTGTGTACATTGAAGTTTTGCATTTAACACAGGGGACATGCTGGGAACAGATGTACACTCCAGGTGGAGAGGTGAGGAATGATGATGTTGATCAAAGCCTAATTATTGCTGCTAGGAACATAGTGAGAAGAGCTGCAGTATCAGCAGATCCACTAGCATCTTTATTAGAAATGTGCCATAGCACACAGATTGGTGGAACAAGGATGGTGGATATTCTCAGGCAAAACCCAACAGAAGAACAAGCTGTGGATATATGCAAAGCAGCAATGGGGCTGAGAATCAGTTCATCCTTCAGTTTTGGCGGATTCACATTCAAGAGAACAAGTGGATCATCAGTCAAAAGGGAGGAAGAAATGCTCACGGGCAATCTGCAAACATTGAAGCTAACTGTGCATGAGGGATATGAAGAGTTCACAATGATTGGGAAAAGGGCAACAGCTATACTTAGAAAAGCAACCAGGAGATTGATTCAACTAATAGTGAGTGGACGAGACGAACAGTCGATAGTCGAAGCAATAGTTGTAGCAATGGTATTCTCACAAGAAGATTGCATGGTAAAAGCAGTTAGAGGTGATCTGAATTTCGTCAATAGAGCGAATCAGCGGTTGAATCCCATGCATCAACTTTTGAGACATTTTCAGAAGGATGCTAAAGTACTTTTCTTAAATTGGGGAATTGAACCTATCGACAATGTGATGGGAATGATTGGGATATTACCTGATATGACTCCAAGTACCGAGATGTCAATGAGAGGAGTGAGAGTCAGCAAAATGGGTGTAGATGAATACTCCAATGCTGAAAAGGTAGTGGTGAGCATTGACCGTTTTTTGAGAGTCCGGGACCAAAGAGGAAATGTACTACTGTCTCCAGAGGAAGTCAGTGAGACACAGGGAACAGAGAAACTGACAATAACTTACTCTTCATCAATGATGTGGGAGATTAATGGCCCTGAGTCAGTGTTGATCAATACCTATCAGTGGATCATCAGAAACTGGGAGACTATTAAAATTCAGTGGTCTCAGAACCCTACAATGCTATACAATAAAATGGAATTCGAGCCATTTCAGTCTCTAGTCCCTAAGGCCATTAGAGGCCAATACAGTGGGTTTGTTAGAACTCTATTCCAACAAATGAGGGATGTGCTTGGGACCTTTGACACAACTCAGATAATAAAACTTCTTCCCTTTGCAGCCGCTCCACCAAAGCAAAGTAGAATGCAATTCTCATCATTGACTGTGAATGTGAGAGGATCAGGAATGAGAATACTTGTAAGGGGTAATTCTCCAGTATTCAACTACAACAAGACCACTAAGAAACTCACAGTCCTCGGAAAGGATGCTGGCACTTTAACTGAAGACCCAGATGAAGGCACAGCTGGAGTGGAATCTGCTGTTTTAAGGGGATTCCTCATTCTAGGCAAAGAAGATAGAAGATATGGGCCAGCATTAAGCATCAATGAATTGAGCAACCTTGCGAAAGGAGAAAAAGCTAATGTGCTAATTGGGCAAGGGGACGTAGTGTTGGTGATGAAACGAAAACGGGACTCTAGCATACTTACTGACAGCCAGACAGCGACCAAAAGAATTCGGATGGCCATCAATTAATTTCGAATAATTTAAAAACGACCTTGTTTCTACT'),
('A_Kawasaki_173_2001_NP', 'Virus', 'A_Kawasaki_173_2001', 'RNA', 'Influenza A', 'AGCAAAAGCAGGGTAGATAATCACTCACTGAGTGACATCAAAGTCATGGCGTCCCAAGGCACCAAACGGTCTTACGAACAGATGGAGACTGATGGGGAACGCCAGAATGCAACTGAAATCAGAGCATCCGTCGGAAGAATGATTGGTGGAATTGGGCGATTCTACATCCAAATGTGCACCGAGCTTAAACTCAATGATTATGAGGGACGACTGATCCAGAACAGCTTAACAATAGAGAGAATGGTGCTCTCTGCTTTTGATGAGAGGAGAAATAAATATCTGGAAGAACATCCCAGCGCGGGGAAAGATCCTAAGAAAACTGGAGGACCCGTATACAAGAGAGTAGATGGAAAGTGGGTGAGGGAACTCGTCCTCTATGACAAAGAAGAAATAAGGCGGATTTGGCGCCAAGCCAACAATGGTGATGATGCAACGGCTGGTTTGACTCACATTATGATCTGGCACTCTAATTTGAATGATACAACTTACCAGAGGACAAGAGCTCTTGTCCGCACCGGAATGGATCCCAGGATGTGCTCTTTGATGCAAGGTTCAACTCTCCCTAGAAGATCTGGAGCAGCAGGCGCTGCAGTCAAAGGAGTTGGGACAATGGTATTGGAATTGATCAGGATGATCAAACGTGGGATCAATGACCGAAACTTCTGGAGGGGTGAGAATGGAAGAAAAACAAGAATTGCTTATGAGAGAATGTGCAACATTCTCAAAGGAAAATTTCAAACAGCTGCACAAAAAGCAATGATGGATCAAGTGAGAGAAAGCCGGAACCCAGGAAATGCTGAGATCGAAGATCTCACTTTTTTGGCACGGTCTGCACTCATATTAAGAGGGTCAGTTGCTCATAAGTCTTGCCTGCCTGCCTGTGTGTATGGACCAGCCGTAGCCAGTGGGTACGACTTCGAAAAAGAGGGATACTCTTTGGTAGGGGTAGACCCTTTCAAACTGCTTCAAACCAGTCAGGTATACAGCCTAATCAGACCAAACGAGAATCCCGCACACAAGAGCCAGTTGGTGTGGATGGCATGCAATTCTGCTGCATTTGAAGATCTAAGAGTGTCAAGCTTCATCAGAGGGACAAAAGTACTTCCAAGGGGGAAGCTCTCCACTAGAGGAGTACAAATTGCTTCAAATGAAAACATGGATGCTATTGTATCAAGTACTCTTGAACTGAGAAGCAGATACTGGGCCATAAGAACCAGAAGTGGAGGGAACACTAATCAACAAAGGGCCTCTGCGGGCCAAATCAGCACACAACCTACGTTTTCTGTGCAGAGAAACCTCCCATTTGACAAAACAACCATCATGGCAGCATTCACTGGGAATACGGAGGGAAGAACATCAGACATGAGGGCAGAAATCATAAAGATGATGGAAAGTGCAAGACCAGAAGAAGTGTCCTTCCAGGGGCGGGGAGTCTTTGAGCTCTCGGACGAAAGGGCAACGAACCCGATCGTGCCCTCCTTTGACATGAGTAATGAAGGATCTTATTTCTTCGGAGACAATGCAGAGGAGTACGACAATTAAAGAAAAATACCCTTGTTTCTACT'),
('A_Kawasaki_173_2001_HA', 'Virus', 'A_Kawasaki_173_2001', 'RNA', 'Influenza A', 'AGCAAAAGCAGGGGAAAATAATAACAACCAAAATGAAAGCAAAACTACTGGTCCTGTTATGTACATTTACAGCTACATACGCAGACACAATATGTATAGGCTACCATGCCAACAACTCAACCGACACTGTTGACACAGTACTTGAGAAGAATGTGACAGTGACACACTCTGTCAACCTACTTGAGGACAGTCACAATGGAAAACTATGTCTACTAAAAGGAATAGCCCCACTACAATTGGGTAATTGCAGCGTTGCCGGATGGATCTTAGGAAACCCAGAATGCGAATTACTGATTTCCAAGGAATCATGGTCCTACATTGTAGAAACACCAAATCCCGAGAATGGAACATGTTACCCAGGGTATTTCGCCGACTATGAGGAACTGAGGGAGCAATTGAGTTCAGTATCTTCATTTGAGAGATTCGAAATATTCCCCAAAGGAAGCTCATGGCCCAACCACACCGTAACCGGAGTATCAGCATCATGCTCCCATAATGGGAAAAGCAGTTTTTACAGAAATTTGCTATGGCTGACGAGGAAGAATGGTTTGTACCCAAACCTGAGCATGTCCTATGTAAACAACAAAGAGAAAGAAGTCCTTGTGCTATGGGGTGTTCATCACCCACCTAACATAGGGGACCAAAGGGCCCTCTACCATACAGAAAATGCTTATGTCTCTGTAGTGTCTTCACATTATAGCAGAAGATTCACCCCAGAAATAGCCAAAAGACCCAAAGTAAGAGATCAGGAAGGAAGAATCAACTACTACTGGACTCTGCTGGAACCCGGGGACACAATAATATTTGAGGCAAATGGAAATCTAATAGCGCCATGGTATGCTTTCGCACTGAGTAGAGGCTTTGGATCAGGAATCATCACCTCAAATGCACCAATGGATGAATGTGATGCGAAGTGTCAAACACCTCAGGGAGCTATAAACAGTAGTCTTCCTTTCCAGAATGTACACCCAGTTACAATAGGAGAGTGTCCAAAGTATGTCAGGAGTGCAAAATTAAGGATGGTTACAGGACTAAGGAACATCCCATCCATTCAATCCAGAGGTTTGTTTGGAGCCATTGCCGGTTTCATTGAAGGGGGGTGGACTGGAATGGTAGATGGGTGGTATGGTTATCATCATCAGAATGAGCAAGGATCTGGCTATGCTGCAGATCAAAAAAGCACACAAAATGCCATTAACGGGATTACAAACAAGGTGAATTCTGTAATTGAGAAAATGAACACTCAATTCACAGCTGTGGGCAAAGAATTCAACAAATTAGAAAGAAGGATGGAAAACTTAAATAAAAAAGTTGATGATGGGTTTCTAGACATTTGGACATATAATGCAGAATTGTTGGTTCTACTGGAAAATGAAAGGACTTTGGATTTCCATGACTCCAATGTGAAGAATCTGTATGAGAAAGTAAAAAGCCAATTAAAGAATAATGCCAAAGAAATAGGAAACGGGTGTTTTGAATTCTATCACAAGTGTAACAATGAATGCATGGAAAGTGTGAAAAATGGAACTTATGACTATCCAAAATATTCCGAAGAATCAAAGTTAAACAGGGAGAAAATTGATGGAGTAAAATTGGAATCAATGGGAGTCTATCAGATTCTGGCGATCTACTCAACTGTCGCCAGTTCCCTGGTTCTTTTGGTCTCCCTGGGGGCAATCAGTTTCTGGATGTGTTCCAATGGGTCTTTGCAGTGTAGAATATGCATCTGAGACCAGAATTTCAGAAATATAAGAAAAAACACCCTTGTTTCTACT'),
('SIVsmE041', 'Virus', 'SIVsmE041', 'RNA', 'SIV', 'CTCAATAATAAGAAGACCCTGGTCTGTTAGGACCCTTTCTGCTTTGGGAAACCGAAGCAGGAAAATCCCTAGCAGATTGGCGCCTGAACAGGGACTTGAAGGAGAGTGAGAGCTCCTGAGTACGGCTGAGTGAAGGCAGTAAGGGCGGCAGGAACAAACCACGACGGAGTGCTCCTATAAAGGCGCGGGCCGGTACCAGGCGGCGTGAGGAGCGGGAGTCGGAGAGGCCTCCGGTTGCAGGTAAGTGCAACAAAAGAGTCATAGGACTGAGTTCCCTACTTTTGAGGAAAGAGTAGGAGAGTGGGAGATGGGCGCGAGAAACTCCGTCTTGTCAGGGAAAAAAGCAGATGAATTAGAAAAAATTAGGTTACGGCCCGGCGGAAAGAAAAAGTACATGCTGAAGCATGTAGTATGGGCAGCAAACGAATTGGACAGATTTGGATTAGCAGAAAGCCTGTTGGAGAACAAAGAAGGTTGTCAAAAAATTCTTTCAGTCTTAGCTCCATTAGTTCCGACAGGTTCAGAAAATTTAAAGAGCCTTTATAATACTGTCTGCGTCATTTGGTGCATTCACGCAGAAGAGAAAGTGAAACATACTGAGGAAGCAAAACAAATAGTGCAGAGACATCTAGTGGTAGAAACAGGAACAGCAGACAAAATGCCAGTAACAAGTAGACCAACAGCACCACCTAGTGGCAGAGGAGGAAATTACCCAGTGCAGCAAGTAGGTGGCAATTATACCCACCTACCCTTAAGTCCAAGAACATTAAATGCTTGGGTAAAATTGATAGAAGAGAAAAAATTTGGGGCAGAAGTAGTGCCAGGATTCCAAGCACTATCAGAAGGCTGCACTCCCTATGACATCAATCAGATGCTAAATTGTGTAGGGGAACATCAATCAGCCATGCAAATTATTAGAGAAATTATAAATGAAGAAGCTGCTGATTGGGATTTACAACACCCACAGCCAGGTCCAATACCAGCAGGACAACTTAGAGATCCGAGAGGATCAGACATTGCAGGAACTACTAGCACAGTAGAAGAACAAATTCAATGGATGTATAGGCAGCAAAACCCTATACCAGTAGGTAACATTTACAGAAGGTGGATCCAATTAGGGCTGCAAAAATGTGTAAGGATGTATAATCCAACAAACATTTTAGATGTGAAACAAGGACCAAAAGAGCCATTTCAAAGCTATGTAGATAGATTCTACAAGAGTCTAAGAGCAGAACAAACAGACCCAGCAGTGAAAAATTGGATGACTCAAACACTGCTGATTCAGAATGCTAACCCGGATTGCAAATTGGTGCTCAAGGGTCTGGGTATGAATCCCACTTTAGAAGAAATGCTGACAGCCTGTCAGGGAGTAGGAGGACCAGGACAAAAAGCTAGACTAATGGCAGAAGCCTTGAAAGAGGCGCTGACGCCAGGGCAACTCCCATTTGCAGCAGTCCAACAGAGAGGACAAAGAAAGACAATTAAATGTTGGAATTGTGGAAAGGAGGGACACTCTGCGAGACAATGCAGAGCCCCTAGAAGACAGGGATGCTGGAAGTGTGGAAAAACAGGCCATGTTATGGCCAAATGCCCCGAGAGACAGGCGGGTTTTTTAGGGCTTGGCCCATGGGGAAAGAAGCCCCGCAATTTCCCCATGGCCCAGATACCTCAGGGGTTGACACCAACTGCTCCCCCAGAGGATCCAGCTGTGGATCTACTGAGGAACTACATGAAGATGGGCAGAAGGCAGAGGGAGAACAGAGAGAGACCTTACAAGGAGGTGACGGAGGATTTGCTGCACCTCAATTCTCTCTTTGGAGAAGACCAGTAGTTACTGCCTACATTGAAGAACAGCCCGTAGAAGTATTATTAGATACAGGGGCTGATGATTCAATTGTAGCAGGGATAGAATTGGGTCCAAATTATACCCCTAAAATAGTAGGAGGAATAGGAGGTTTCATTAACACCAAGGAATATAAAGATGTAAAAATAAAAGTCTTAGGCAAGGTAATTAAGGGAACAATTATGACAGGAGATACCCCAATTAACATTTTTGGCAGAAATCTGCTAACAGCTATGGGCATGTCTCTAAATCTCCCCATAGCTAAGGTGGAACCTATCAAAGTAACACTAAAACCAGGAAAAGATGGACCAAAATTAAGACAGTGGCCACTATCAAAAGAAAAGATAATTGCATTAAGAGAAATCTGTGAAAAAATGGAAAAAGATGGCCAGTTAGAGGAAGCCCCTCCAACCAATCCATATAACACCCCCACATTTGCTATAAAGAAGAAAGACAAAAATAAATGGAGGATGCTAATAGACTTTAGAGAATTAAACAAGGTTACTCAAGATTTTACAGAAGTACAGTTAGGAATACCACACCCTGCAGGACTAGCAAAGAGAAGAAGGATCACAGTATTGGATGTAGGTGATGCATATTTTTCCATACCTTTAGATGAGGAATTCAGGCAATACACTGCCTTTACTTTACCATCAGTAAACAATGCAGAACCAGGAAAAAGATACATCTATAAGGTATTACCTCAAGGGTGGAAAGGATCACCAGCTATTTTTCAGCATACTATGAGAAATGTCTTAGAACCTTTCAGAAAAGCAAATCCAGATGTGACCCTGATCCAATACATGGATGACATCCTAATAGCTAGTGATAGAACAGATTTAGAACATGACAGGGTAGTTTTACAGTTAAAGGAACTTCTAAACAGTATGGGATTTTCCACCCCAGAAGAGAAGTTCCAGAAAGATCCCCCATTCCAGTGGATGGGATATGAATTGTGGCCAACCAAATGGAAACTGCAAAAAATAGAGTTGCCACAAAAAGAAACCTGGACAGTAAATGATATACAAAAATTAGTAGGAGTGCTAAATTGGGCAGCACAAATTTATCCAGGAATAAAGACTAAACACCTTTGCAGATTAATCAGAGGAAAAATGACTTTAACAGAAGAGGTTCAGTGGACTGAGATGGCAGAGGCAGAATATGAAGAAAACAAGATAATTCTCAGTCAAGAACAAGAAGGGTGTTATTATCAAGAGGGAAAGCCACTGGAGGCAACAGTAATAAAGAGTCAGGATAATCAATGGTCATATAAAATTCACCAAGAAGACAAAATACTAAAAGTAGGCAAATTTGCAAAGATTAAGAATACACATACAAATGGAGTCAGATTATTAGCACATGTAGTACAGAAAATAGGAAAAGAAGCAATAGTAATTTGGGGACAGGTGCCAAAATTTCATTTGCCAGTAGAGAGAGAAATTTGGGAACAATGGTGGACAGATTATTGGCAAGTAACCTGGATACCAGAATGGGACTTTGTATCAACACCTCCCTTAGTCAGATTAGTCTTCAACCTAGTAAAAGAGCCTATACAGGGAGCAGAAACATTTTATGTAGATGGATCCTGTAACAGACAGTCAAAAGAAGGAAAGGCAGGCTATGTGACAGACAGAGGCAGAGACAGAACAAAACCGCTGGAACAGACTACCAATCAACAAGCAGAGTTGGAAGCCTTCCATCTAGCCTTAGCAGATTCAGGACCAAAAGCCAATATAATAGTAGACTCCCAATATGTTATGGGCATAATAGCGGGTCAACCCACTGAATCAGAAAGTAGATTAGTAAATCAGATAATAGAGGAAATGATTAAAAAGGAAGCAATTTATGTAGCGTGGGTACCTGCACATAAAGGAATAGGAGGAAATCAAGAAGTAGATCATCTGGTAAGTCAAGGAATTAGACAAGTCCTATTCTTAGAAAAAATAGAACCAGCGCAAGAAGAGCATGAGAAGTACCATAGCAATGTAAAAGAATTAGTATTCAAATTTGGATTACCTAGGCTAGTAGCAAAACAGATAGTAGACACATGTGATAAATGTCACCAGAAAGGAGAGGCCATACATGGACAAGTAAATGCAGAACTAGGGACTTGGCAAATGGACTGTACACACCTAGAGGGCAAAATAATTATAGTTGCAGTACATGTGGCTAGTGGATTCATAGAGGCAGAAGTAATCCCGCAGGAAACAGGAAGACAAACAGCACTGTTTCTGCTAAAATTAGCCAGCAGATGGCCCATCACACATCTGCATACTGATAATGGTGCCAACTTCACATCGCAAGAAGTGAAAATGGTTGCTTGGTGGGCAGGGATTGAACAGACCTTTGGGGTGCCTTATAATCCACAGAGCCAGGGAGTGGTGGAAGCAATGAACCATCATCTAAAAACCCAGATAGATAGAATTAGGGAACAGGCAAATTCAATAGAGACTATAGTACTAATGGCAGTTCATTGCATGAATTTTAAAAGAAGGGGAGGAATAGGGGATATGACTCCAGCAGAAAGATTAGTCAATATGATCACCACAGAACAAGAAATACAATTCCAACAATCAAAAAATTCAAAATTTAAAAATTTTCGGGTCTATTACAGAGAAGGCAGAGACCAGCTGTGGAAAGGACCCGGTGAGCTATTGTGGAAAGGGGAAGGAGCAGTCATCCTAAAGGTAGGGACAGAAATCAAGGTAGTACCAAGGAGGAAAGCTAAAATTATCAAAGACTATGGAGGAGGAAAAGAGTTGGATAGCGGTTCCCACTTGGAGGATACCGGGGAGGCTAGAGAAGTGGCATAGCCTCATCAAACACCTGAAATATAACACTAAAGACCTACAGAAGGCTTGTTATGTACCCCATCATAAAGTTGGATGGGCATGGTGGACTTGCAGCAGGGTGATCTTCCCATTAAGGGATGAGTCTCATTTGGAAGTACAAGGATATTGGAATTTGACACCAGAGAAAGGATGGCTCAGTACTTATGCAGTGAGAATAACCTGGTACTCCAGAAATTTCTGGACAGATGTAACACCAGATTATGCAGACACTTTACTGCATGGCACTTATTTCCCTTGCTTTTCAGAGGGAGAAGTACGAAGGGCCATCAGGGGAGAGAAATTGCTGTCTTGCTGCAAGTTCCCGAAAGCTCATAAGAATCAGGTACCAAGCCTACAGTATCTAGCACTAACAGTAGTGAGTCATGTCAGATCCCAGGGAGAGGATCCCACCTGGAAACAGTGGAGAGGAAACAGTAGGCGAGGCCTTCGACTGGCTAGAAAGAACAGTAGAAGAAATAAACAGGGCAGCAGTGAATCATTTGCCGAGGGAGTTAATTTTCCAGGTTTGGCGAAGGTCCTGGGAATACTGGCATGATGAAATAGGGATGTCAGCCAGCTACACAAAATATAGATACTTGTGCTTGATACAAAAAGCTTTGTTTATGCATTGCAAGAAAGGGTGTAGGTGCTTAGGAGGAGAGCATGGGGCAGGGGGATGGAGACCAGGGCCTCCTCCTCCTCCCCCTCCAGGACTAGCATAAAATGACAGAAAGACCTCCAGAAGATGAAGCCCCACAGAGGGAACCGTGGGATGAATGGGTAGTAGAAGTTCTGGAGGAAGTAAAAGAAGAAGCCCTGAAACATTTTGATCCTCGCTTGCTAACTGCGCTTGGTAACTATATCTATGATAGACATGGAGACACCCTTGAAGGAGCAGGAGAGCTCATTAAAATCCTCCAGAGAGCACTCTTCATCCATTTCAGAGGTGGATGCAACCACTCCAGAATCGGCCACTCTGGAGGAGGAAATCCTCTCTCAACTATACCGCCCTCTAGAGGCGTGCTATAACAAGTGCTACTGTAAGAAGTGTTGCTATCATTGTCAGCATTGTTTTCTTAAAAAGGGTTTGGGAATATGCTATGAGCAGCAACGAAGAAGAACTCCGAAGAAGACTAAGGCTAATACATTTTCTGCATCAAACAAGTAAGTATGGGATGTCTTGGGAATCAGCTGCTTATCGCGCTCTTGCTATTAAGTGCTTTAGGGATTTCTTGTGTTCAATATGTAACAGTGTTCTATGGTGTACCAGCATGGAAGAATGCGACAATTCCCCTCTTCTGTGCAACCAAGAATAGGGATACTTGGGGAACAACACAATGCTTGCCAGATAATGATGATTACTCAGAATTGGCAATTAATGTCACAGAGGCTTTTGATGCTTGGGATAATACAGTCACAGAACAAGCAATAGAGGATGTGTGGAACCTCTTTCAAACATCCATTAAGCCCTGTGTAAAACTTACCCCACTATGTATAGCAATGAGGTGTAATAAAACTGAAACAGATAGATGGGGCTTAACAGGAAAACCAACAACAACAGCATCAACAACAACAAAAACAACATCAAAACCATCAGTAATAACAGCAAAGGTTATAAATGAAGGTGATCCATGCATAAAAAATAATAGTTGTGCAGGCTTGGAACAAGAACCCATGATAGGTTGTAAATTTAACATGACAGGGTTAAGAAAGGACAAACAGAGAGAATATAATGAAACATGGTATTCAAGAGATATAGTTTGTGAACAAAATAGCAATGAACATGAAACTGCCAGTAAATGTTATATGAACCATTGTAACACTAGTGTTATTCGAGAATCCTGTGACAAGCATTATTGGGATGCTATTAGATTTAGATATTGTGCTCCGCCAGGTTATGCTTTGCTTAGGTGTAATGATTCAAATTATTCAGGCTTTGAACCTAACTGTACTAAGGTAGTAGTTTCTTCATGCACAAGAATGATGGAAACACAAACCTCTACTTGGTTTGGTTTCAATGGTACTAGAGCAGAAAATAGAACATACATTTATTGGCATGGTAGAAGCAATAGAACCATAATTAGCTTAAATAAGTATTATAATCTAACAATAAGATGTAGGAGACCAGGAAATAAGACAGTCTTACCAGTCACCATTATGTCAGGGTTGGTCTTCCATTCGCAACCCATAAATGAGAGACCAAAACAGGCCTGGTGCTGGTTTGGAGGAAACTGGAAAGGGGCTATCCGAGAAGTGAAGGAAACCTTGGTCAAACATCCCAGGTATACGGGAACTAATAATACTGAGAAGATTAATCTAACAGCTCCAGCAGGAGGAGATCCGGAAGTTACTTTCATGTGGACAAATTGTCGAGGAGAATTCTTATATTGCAAAATGAATTGGTTTCTTAATTGGGTAGATGAGACAAGTGGTTTTAGATGGAATAAACAAAACCCGAAGGAGAAGAAAAGGAGGAATTATGTGCCATGTCATATTAGACAGGTAATTAATACGTGGCACAGGGTAGGCAAAAATGTGTATTTGCCTCCTAGGGAAGGAGACCTGACATGTAATTCCACTGTAACTAGCCTCATAGCAGAAATAGATTGGATCGATAAAAATGAGACCAATATCACCATGAGTGCAGAGGTGGCAGAGCTGTATCGATTGGAGTTGGGAGATTACAAATTAGTAGAAATTACTCCAATTGGCTTGGCCCCCACAAGTGTAAGAAGGTACACCACAACCGGTGCCTCAAGAAATAAAAGAGGGGTCTTTGTGCTAGGGTTCTTGGGTTTTCTCGCAACAGCAGGTTCTGCAATGGGCGCGGCGTCGCTGACGCTGTCCGCTCAGTCCCGGACTTTGTTGGCTGGGATAGTGCAGCAACAGCAACAGCTGTTGGATGTGGTCAAGAGACAACAAGAATTGTTGCGACTGACCGTCTGGGGAACTAAGAACCTCCAGACTAGAGTCACTGCTATCGAGAAGTACCTAAAGGATCAGGCGCAGCTAAATTCATGGGGATGTGCTTTTAGGCAGGTCTGCCACACTACTGTACCATGGCCAAATGACACATTGGTACCTAATTGGAACAATATGACTTGGCAAGAGTGGGAAAGACAGGTTGACTTCCTAGAGGCAAATATAACTCAATTATTGGAAGAAGCACAAATTCAGCAAGAAAAGAATATGTATGAGTTGCAAAAATTAAATAGCTGGGATATCTTTGGCAATTGGTTTGACCTTACTTCTTGGATAAGATATATACAATATGGTGTACTTATAGTTCTAGGAGTAATAGGATTAAGAATAGTGATATATGTAGTGCAGATGTTAGCTAGGTTAAGACAAGGTTATAGGCCAGTGTTCTCTTCCCCTCCCGTTTATGTTCAGCAGATCCCTATCCAGAAGGGCCAGGAACCGCCAACCAAAGAAGGAGAAGAAGGAGACGGTGGAGACAGAGGTGGCAACAGATCTTGGCCTTGGCAGATAGAATATATTCATTTCCTGATCCGCCAGCTAATACGCCTCTTGAGTTGGCTATTCAACAGTTGCAGAGATTGGCTATTGAGGAGCTACCAGATCCTCCAGCCAGTGCTCCAGAGCCTCTCAAGGATACTGCAGAGAGTCCGTGAAGTCATCAGAGTTGAGATAACCTACCTACAGTATGGGTGGCGTTACTTCCAAGAAGCAGCGCAAGCATGGTGGAAATTTGCGCGAGAGACTCTTGCAAGCGCGTGGGGAGACTTATGGGAGACTCTGGGACGGGTTGGAAGGAGATTACTCGCAATCCCAAGACGGATCAGGCAGGGGCTTGAGCTCACTCTCTTGTGAGCCTCAGAAATATTGTGAGGGTCAATTTATGAATACCCCTTGGAGAAACCCAAGAGCAGAAGGAGCAAAATTAGATTATAGACAACAAAACATGGATGATGTGGATGATGATGATGATGACTTAGTAGGTTTTCCAGTGACCCCAAAAGTCCCCTTAAGGACCATGACATACAAATTGGCAATAGACATGTCTCATTTTATAAAAGAAAAGGGGGGACTGGAAGGGATTTATTACAGTGATAGGAGACATAAAATATTGAATCTGTACTTAGAAAAGGAAGAAGGAATAATACCAGATTGGCAAAATTACACAGCAGGGCCAGGAATCAGATACCCTATGTGTTTTGGATGGCTCTGGAAATTAGTCCCAGTAGATGTCTCAGATGAAGCTCAGGAGGACGAGGCACATTGCTTGATGCATCCAGCACAGACCTCTCAGTGGGATGACCCCTGGGGAGAGGTACTGGCATGGAAGTTTGATCCAGAGTTAGCTTATAACTATAAGGCATTTGTTAAGCACCCAGAAGAGTTTGGTAGTAGCTCAGGCTTGTCAGAGGAAGAGGTAAAGAGAAGGCTAACCGCAAGAGGCCTTTTAAAAATGGCTGACAAGAAGGAAACAAGCTGAGACAGCAGGGACTTTCCACAAAGGGGATGTTATGGGGAGGTACTGGGGAGGAGCTGGCTGGAACGCCCACTTATTCTATGTATAAATATCACTGCATTTCGCTCTGTATTCAGTCGCTCTGCGGAGAGGCTGGCAGATTGAGCCCTGGGAGGTTCTCTCCAGCACTAGCAGGTAGAGCCTGGGTGTTCCCTGCTAGACTCTCACCAGCACTTGGCCGGTGCTGGGCAGAGTGACTCCACGCTTGCTTGCTTAAAGCCCTCTTCAATAAAGCTGCCATTTTAGAAGTAAGCTAGTGTGTGTTCCCATCTCTCCTAGCCGCCGCCTGGTCAACTCGGTACTCAATAATAAGAAGACCCTGGTCTGTTAGGACCCTTTCTGCTTTGGGAAACCGAAGCAGGAAAATCCCTAGCA'),
('SIVmac239deltaNef', 'Virus', 'SIVmac239deltaNef', 'RNA', 'SIV', 'GCATGCACATTTTAAAGGCTTTTGCTAAATATAGCCAAAAGTCCTTCTACAAATTTTCTAAGAGTTCTGATTCAAAGCAGTAACAGGCCTTGTCTCATCATGAACTTTGGCATTTCATCTACAGCTAAGTTTATATCATAAATAGTTCTTTACAGGCAGCACCAACTTATACCCTTATAGCATACTTTACTGTGTGAAAATTGCATCTTTCATTAAGCTTACTGTAAATTTACTGGCTGTCTTCCTTGCAGGTTTCTGGAAGGGATTTATTACAGTGCAAGAAGACATAGAATCTTAGACATATACTTAGAAAAGGAAGAAGGCATCATACCAGATTGGCAGGATTACACCTCAGGACCAGGAATTAGATACCCAAAGACATTTGGCTGGCTATGGAAATTAGTCCCTGTAAATGTATCAGATGAGGCACAGGAGGATGAGGAGCATTATTTAATGCATCCAGCTCAAACTTCCCAGTGGGATGACCCTTGGGGAGAGGTTCTAGCATGGAAGTTTGATCCAACTCTGGCCTACACTTATGAGGCATATGTTAGATACCCAGAAGAGTTTGGAAGCAAGTCAGGCCTGTCAGAGGAAGAGGTTAGAAGAAGGCTAACCGCAAGAGGCCTTCTTAACATGGCTGACAAGAAGGAAACTCGCTGAAACAGCAGGGACTTTCCACAAGGGGATGTTACGGGGAGGTACTGGGGAGGAGCCGGTCGGGAACGCCCACTTTCTTGATGTATAAATATCACTGCATTTCGCTCTGTATTCAGTCGCTCTGCGGAGAGGCTGGCAGATTGAGCCCTGGGAGGTTCTCTCCAGCACTAGCAGGTAGAGCCTGGGTGTTCCCTGCTAGACTCTCACCAGCACTTGGCCGGTGCTGGGCAGAGTGACTCCACGCTTGCTTGCTTAAAGCCCTCTTCAATAAAGCTGCCATTTTAGAAGTAAGCTAGTGTGTGTTCCCATCTCTCCTAGCCGCCGCCTGGTCAACTCGGTACTCAATAATAAGAAGACCCTGGTCTGTTAGGACCCTTTCTGCTTTGGGAAACCGAAGCAGGAAAATCCCTAGCAGATTGGCGCCTGAACAGGGACTTGAAGGAGAGTGAGAGACTCCTGAGTACGGCTGAGTGAAGGCAGTAAGGGCGGCAGGAACCAACCACGACGGAGTGCTCCTATAAAGGCGCGGGTCGGTACCAGACGGCGTGAGGAGCGGGAGAGGAAGAGGCCTCCGGTTGCAGGTAAGTGCAACACAAAAAAGAAATAGCTGTCTTTTATCCAGGAAGGGGTAATAAGATAGAGTGGGAGATGGGCGTGAGAAACTCCGTCTTGTCAGGGAAGAAAGCAGATGAATTAGAAAAAATTAGGCTACGACCCAACGGAAAGAAAAAGTACATGTTGAAGCATGTAGTATGGGCAGCAAATGAATTAGATAGATTTGGATTAGCAGAAAGCCTGTTGGAGAACAAAGAAGGATGTCAAAAAATACTTTCGGTCTTAGCTCCATTAGTGCCAACAGGCTCAGAAAATTTAAAAAGCCTTTATAATACTGTCTGCGTCATCTGGTGCATTCACGCAGAAGAGAAAGTGAAACACACTGAGGAAGCAAAACAGATAGTGCAGAGACACCTAGTGGTGGAAACAGGAACAACAGAAACTATGCCAAAAACAAGTAGACCAACAGCACCATCTAGCGGCAGAGGAGGAAATTACCCAGTACAACAAATAGGTGGTAACTATGTCCACCTGCCATTAAGCCCGAGAACATTAAATGCCTGGGTAAAATTGATAGAGGAAAAGAAATTTGGAGCAGAAGTAGTGCCAGGATTTCAGGCACTGTCAGAAGGTTGCACCCCCTATGACATTAATCAGATGTTAAATTGTGTGGGAGACCATCAAGCGGCTATGCAGATTATCAGAGATATTATAAACGAGGAGGCTGCAGATTGGGACTTGCAGCACCCACAACCAGCTCCACAACAAGGACAACTTAGGGAGCCGTCAGGATCAGATATTGCAGGAACAACTAGTTCAGTAGATGAACAAATCCAGTGGATGTACAGACAACAGAACCCCATACCAGTAGGCAACATTTACAGGAGATGGATCCAACTGGGGTTGCAAAAATGTGTCAGAATGTATAACCCAACAAACATTCTAGATGTAAAACAAGGGCCAAAAGAGCCATTTCAGAGCTATGTAGACAGGTTCTACAAAAGTTTAAGAGCAGAACAGACAGATGCAGCAGTAAAGAATTGGATGACTCAAACACTGCTGATTCAAAATGCTAACCCAGATTGCAAGCTAGTGCTGAAGGGGCTGGGTGTGAATCCCACCCTAGAAGAAATGCTGACGGCTTGTCAAGGAGTAGGGGGGCCGGGACAGAAGGCTAGATTAATGGCAGAAGCCCTGAAAGAGGCCCTCGCACCAGTGCCAATCCCTTTTGCAGCAGCCCAACAGAGGGGACCAAGAAAGCCAATTAAGTGTTGGAATTGTGGGAAAGAGGGACACTCTGCAAGGCAATGCAGAGCCCCAAGAAGACAGGGATGCTGGAAATGTGGAAAAATGGACCATGTTATGGCCAAATGCCCAGACAGACAGGCGGGTTTTTTAGGCCTTGGTCCATGGGGAAAGAAGCCCCGCAATTTCCCCATGGCTCAAGTGCATCAGGGGCTGATGCCAACTGCTCCCCCAGAGGACCCAGCTGTGGATCTGCTAAAGAACTACATGCAGTTGGGCAAGCAGCAGAGAGAAAAGCAGAGAGAAAGCAGAGAGAAGCCTTACAAGGAGGTGACAGAGGATTTGCTGCACCTCAATTCTCTCTTTGGAGGAGACCAGTAGTCACTGCTCATATTGAAGGACAGCCTGTAGAAGTATTACTGGATACAGGGGCTGATGATTCTATTGTAACAGGAATAGAGTTAGGTCCACATTATACCCCAAAAATAGTAGGAGGAATAGGAGGTTTTATTAATACTAAAGAATACAAAAATGTAGAAATAGAAGTTTTAGGCAAAAGGATTAAAGGGACAATCATGACAGGGGACACCCCGATTAACATTTTTGGTAGAAATTTGCTAACAGCTCTGGGGATGTCTCTAAATTTTCCCATAGCTAAAGTAGAGCCTGTAAAAGTCGCCTTAAAGCCAGGAAAGGATGGACCAAAATTGAAGCAGTGGCCATTATCAAAAGAAAAGATAGTTGCATTAAGAGAAATCTGTGAAAAGATGGAAAAGGATGGTCAGTTGGAGGAAGCTCCCCCGACCAATCCATACAACACCCCCACATTTGCTATAAAGAAAAAGGATAAGAACAAATGGAGAATGCTGATAGATTTTAGGGAACTAAATAGGGTCACTCAGGACTTTACGGAAGTCCAATTAGGAATACCACACCCTGCAGGACTAGCAAAAAGGAAAAGAATTACAGTACTGGATATAGGTGATGCATATTTCTCCATACCTCTAGATGAAGAATTTAGGCAGTACACTGCCTTTACTTTACCATCAGTAAATAATGCAGAGCCAGGAAAACGATACATTTATAAGGTTCTGCCTCAGGGATGGAAGGGGTCACCAGCCATCTTCCAATACACTATGAGACATGTGCTAGAACCCTTCAGGAAGGCAAATCCAGATGTGACCTTAGTCCAGTATATGGATGACATCTTAATAGCTAGTGACAGGACAGACCTGGAACATGACAGGGTAGTTTTACAGTCAAAGGAACTCTTGAATAGCATAGGGTTTTCTACCCCAGAAGAGAAATTCCAAAAAGATCCCCCATTTCAATGGATGGGGTACGAATTGTGGCCAACAAAATGGAAGTTGCAAAAGATAGAGTTGCCACAAAGAGAGACCTGGACAGTGAATGATATACAGAAGTTAGTAGGAGTATTAAATTGGGCAGCTCAAATTTATCCAGGTATAAAAACCAAACATCTCTGTAGGTTAATTAGAGGAAAAATGACTCTAACAGAGGAAGTTCAGTGGACTGAGATGGCAGAAGCAGAATATGAGGAAAATAAAATAATTCTCAGTCAGGAACAAGAAGGATGTTATTACCAAGAAGGCAAGCCATTAGAAGCCACGGTAATAAAGAGTCAGGACAATCAGTGGTCTTATAAAATTCACCAAGAAGACAAAATACTGAAAGTAGGAAAATTTGCAAAGATAAAGAATACACATACCAATGGAGTGAGACTATTAGCACATGTAATACAGAAAATAGGAAAGGAAGCAATAGTGATCTGGGGACAGGTCCCAAAATTCCACTTACCAGTTGAGAAGGATGTATGGGAACAGTGGTGGACAGACTATTGGCAGGTAACCTGGATACCGGAATGGGATTTTATCTCAACACCACCGCTAGTAAGATTAGTCTTCAATCTAGTGAAGGACCCTATAGAGGGAGAAGAAACCTATTATACAGATGGATCATGTAATAAACAGTCAAAAGAAGGGAAAGCAGGATATATCACAGATAGGGGCAAAGACAAAGTAAAAGTGTTAGAACAGACTACTAATCAACAAGCAGAATTGGAAGCATTTCTCATGGCATTGACAGACTCAGGGCCAAAGGCAAATATTATAGTAGATTCACAATATGTTATGGGAATAATAACAGGATGCCCTACAGAATCAGAGAGCAGGCTAGTTAATCAAATAATAGAAGAAATGATTAAAAAGTCAGAAATTTATGTAGCATGGGTACCAGCACACAAAGGTATAGGAGGAAACCAAGAAATAGACCACCTAGTTAGTCAAGGGATTAGACAAGTTCTCTTCTTGGAAAAGATAGAGCCAGCACAAGAAGAACATGATAAATACCATAGTAATGTAAAAGAATTGGTATTCAAATTTGGATTACCCAGAATAGTGGCCAGACAGATAGTAGACACCTGTGATAAATGTCATCAGAAAGGAGAGGCTATACATGGGCAGGCAAATTCAGATCTAGGGACTTGGCAAATGGATTGTACCCATCTAGAGGGAAAAATAATCATAGTTGCAGTACATGTAGCTAGTGGATTCATAGAAGCAGAGGTAATTCCACAAGAGACAGGAAGACAGACAGCACTATTTCTGTTAAAATTGGCAGGCAGATGGCCTATTACACATCTACACACAGATAATGGTGCTAACTTTGCTTCGCAAGAAGTAAAGATGGTTGCATGGTGGGCAGGGATAGAGCACACCTTTGGGGTACCATACAATCCACAGAGTCAGGGAGTAGTGGAAGCAATGAATCACCACCTGAAAAATCAAATAGATAGAATCAGGGAACAAGCAAATTCAGTAGAAACCATAGTATTAATGGCAGTTCATTGCATGAATTTTAAAAGAAGGGGAGGAATAGGGGATATGACTCCAGCAGAAAGATTAATTAACATGATCACTACAGAACAAGAGATACAATTTCAACAATCAAAAAACTCAAAATTTAAAAATTTTCGGGTCTATTACAGAGAAGGCAGAGATCAACTGTGGAAGGGACCCGGTGAGCTATTGTGGAAAGGGGAAGGAGCAGTCATCTTAAAGGTAGGGACAGACATTAAGGTAGTACCCAGAAGAAAGGCTAAAATTATCAAAGATTATGGAGGAGGAAAAGAGGTGGATAGCAGTTCCCACATGGAGGATACCGGAGAGGCTAGAGAGGTGGCATAGCCTCATAAAATATCTGAAATATAAAACTAAAGATCTACAAAAGGTTTGCTATGTGCCCCATTTTAAGGTCGGATGGGCATGGTGGACCTGCAGCAGAGTAATCTTCCCACTACAGGAAGGAAGCCATTTAGAAGTACAAGGGTATTGGCATTTGACACCAGAAAAAGGGTGGCTCAGTACTTATGCAGTGAGGATAACCTGGTACTCAAAGAACTTTTGGACAGATGTAACACCAAACTATGCAGACATTTTACTGCATAGCACTTATTTCCCTTGCTTTACAGCGGGAGAAGTGAGAAGGGCCATCAGGGGAGAACAACTGCTGTCTTGCTGCAGGTTCCCGAGAGCTCATAAGTACCAGGTACCAAGCCTACAGTACTTAGCACTGAAAGTAGTAAGCGATGTCAGATCCCAGGGAGAGAATCCCACCTGGAAACAGTGGAGAAGAGACAATAGGAGAGGCCTTCGAATGGCTAAACAGAACAGTAGAGGAGATAAACAGAGAGGCGGTAAACCACCTACCAAGGGAGCTAATTTTCCAGGTTTGGCAAAGGTCTTGGGAATACTGGCATGATGAACAAGGGATGTCACCAAGCTATGTAAAATACAGATACTTGTGTTTAATACAAAAGGCTTTATTTATGCATTGCAAGAAAGGCTGTAGATGTCTAGGGGAAGGACATGGGGCAGGGGGATGGAGACCAGGACCTCCTCCTCCTCCCCCTCCAGGACTAGCATAAATGGAAGAAAGACCTCCAGAAAATGAAGGACCACAAAGGGAACCATGGGATGAATGGGTAGTGGAGGTTCTGGAAGAACTGAAAGAAGAAGCTTTAAAACATTTTGATCCTCGCTTGCTAACTGCACTTGGTAATCATATCTATAATAGACATGGAGACACCCTTGAGGGAGCAGGAGAACTCATTAGAATCCTCCAACGAGCGCTCTTCATGCATTTCAGAGGCGGATGCATCCACTCCAGAATCGGCCAACCTGGGGGAGGAAATCCTCTCTCAGCTATACCGCCCTCTAGAAGCATGCTATAACACATGCTATTGTAAAAAGTGTTGCTACCATTGCCAGTTTTGTTTTCTTAAAAAAGGCTTGGGGATATGTTATGAGCAATCACGAAAGAGAAGAAGAACTCCGAAAAAGGCTAAGGCTAATACATCTTCTGCATCAAACAAGTAAGTATGGGATGTCTTGGGAATCAGCTGCTTATCGCCATCTTGCTTTTAAGTGTCTATGGGATCTATTGTACTCTATATGTCACAGTCTTTTATGGTGTACCAGCTTGGAGGAATGCGACAATTCCCCTCTTTTGTGCAACCAAGAATAGGGATACTTGGGGAACAACTCAGTGCCTACCAGATAATGGTGATTATTCAGAAGTGGCCCTTAATGTTACAGAAAGCTTTGATGCCTGGAATAATACAGTCACAGAACAGGCAATAGAGGATGTATGGCAACTCTTTGAGACCTCAATAAAGCCTTGTGTAAAATTATCCCCATTATGCATTACTATGAGATGCAATAAAAGTGAGACAGATAGATGGGGATTGACAAAATCAATAACAACAACAGCATCAACAACATCAACGACAGCATCAGCAAAAGTAGACATGGTCAATGAGACTAGTTCTTGTATAGCCCAGGATAATTGCACAGGCTTGGAACAAGAGCAAATGATAAGCTGTAAATTCAACATGACAGGGTTAAAAAGAGACAAGAAAAAAGAGTACAATGAAACTTGGTACTCTGCAGATTTGGTATGTGAACAAGGGAATAACACTGGTAATGAAAGTAGATGTTACATGAACCACTGTAACACTTCTGTTATCCAAGAGTCTTGTGACAAACATTATTGGGATGCTATTAGATTTAGGTATTGTGCACCTCCAGGTTATGCTTTGCTTAGATGTAATGACACAAATTATTCAGGCTTTATGCCTAAATGTTCTAAGGTGGTGGTCTCTTCATGCACAAGGATGATGGAGACACAGACTTCTACTTGGTTTGGCTTTAATGGAACTAGAGCAGAAAATAGAACTTATATTTACTGGCATGGTAGGGATAATAGGACTATAATTAGTTTAAATAAGTATTATAATCTAACAATGAAATGTAGAAGACCAGGAAATAAGACAGTTTTACCAGTCACCATTATGTCTGGATTGGTTTTCCACTCACAACCAATCAATGATAGGCCAAAGCAGGCATGGTGTTGGTTTGGAGGAAAATGGAAGGATGCAATAAAAGAGGTGAAGCAGACCATTGTCAAACATCCCAGGTATACTGGAACTAACAATACTGATAAAATCAATTTGACGGCTCCTGGAGGAGGAGATCCGGAAGTTACCTTCATGTGGACAAATTGCAGAGGAGAGTTCCTCTACTGTAAAATGAATTGGTTTCTAAATTGGGTAGAAGATAGGAATACAGCTAACCAGAAGCCAAAGGAACAGCATAAAAGGAATTACGTGCCATGTCATATTAGACAAATAATCAACACTTGGCATAAAGTAGGCAAAAATGTTTATTTGCCTCCAAGAGAGGGAGACCTCACGTGTAACTCCACAGTGACCAGTCTCATAGCAAACATAGATTGGATTGATGGAAACCAAACTAATATCACCATGAGTGCAGAGGTGGCAGAACTGTATCGATTGGAATTGGGAGATTATAAATTAGTAGAGATCACTCCAATTGGCTTGGCCCCCACAGATGTGAAGAGGTACACTACTGGTGGCACCTCAAGAAATAAAAGAGGGGTCTTTGTGCTAGGGTTCTTGGGTTTTCTCGCAACGGCAGGTTCTGCAATGGGCGCGGCGTCGTTGACGCTGACCGCTCAGTCCCGAACTTTATTGGCTGGGATAGTGCAGCAACAGCAACAGCTGTTGGACGTGGTCAAGAGACAACAAGAATTGTTGCGACTGACCGTCTGGGGAACAAAGAACCTCCAGACTAGGGTCACTGCCATCGAGAAGTACTTAAAGGACCAGGCGCAGCTGAATGCTTGGGGATGTGCGTTTAGACAAGTCTGCCACACTACTGTACCATGGCCAAATGCAAGTCTAACACCAAAGTGGAACAATGAGACTTGGCAAGAGTGGGAGCGAAAGGTTGACTTCTTGGAAGAAAATATAACAGCCCTCCTAGAGGAGGCACAAATTCAACAAGAGAAGAACATGTATGAATTACAAAAGTTGAATAGCTGGGATGTGTTTGGCAATTGGTTTGACCTTGCTTCTTGGATAAAGTATATACAATATGGAGTTTATATAGTTGTAGGAGTAATACTGTTAAGAATAGTGATCTATATAGTACAAATGCTAGCTAAGTTAAGGCAGGGGTATAGGCCAGTGTTCTCTTCCCCACCCTCTTATTTCCAGCAGACCCATATCCAACAGGACCCGGCACTGCCAACCAGAGAAGGCAAAGAAAGAGACGGTGGAGAAGGCGGTGGCAACAGCTCCTGGCCTTGGCAGATAGAATATATTCATTTCCTGATCCGCCAACTGATACGCCTCTTGACTTGGCTATTCAGCAACTGCAGAACCTTGCTATCGAGAGTATACCAGATCCTCCAACCAATACTCCAGAGGCTCTCTGCGACCCTACAGAGGATTCGAGAAGTCCTCAGGACTGAACTGACCTACCTACAATATGGGTGGAGCTATTTCCATGAGGCGGTCCAGGCCGTCTGGAGATCTGCGACAGAGACTCTTGCGGGCGCGTGGGGAGACTTATGGGAGACTCTTAGGAGAGGTGGAAGATGGATACTCGCAATCCCCAGGAGGATTAGACAAGGGCTTGAGCTCACTCTCTTGTGAGGGACAGGTCTCATTTTATAAAAGAAAAGGGGGGACTGGAAGGGATTTATTACAGTGCAAGAAGACATAGAATCTTAGACATATACTTAGAAAAGGAAGAAGGCATCATACCAGATTGGCAGGATTACACCTCAGGACCAGGAATTAGATACCCAAAGACATTTGGCTGGCTATGGAAATTAGTCCCTGTAAATGTATCAGATGAGGCACAGGAGGATGAGGAGCATTATTTAATGCATCCAGCTCAAACTTCCCAGTGGGATGACCCTTGGGGAGAGGTTCTAGCATGGAAGTTTGATCCAACTCTGGCCTACACTTATGAGGCATATGTTAGATACCCAGAAGAGTTTGGAAGCAAGTCAGGCCTGTCAGAGGAAGAGGTTAGAAGAAGGCTAACCGCAAGAGGCCTTCTTAACATGGCTGACAAGAAGGAAACTCGCTGAAACAGCAGGGACTTTCCACAAGGGGATGTTACGGGGAGGTACTGGGGAGGAGCCGGTCGGGAACGCCCACTTTCTTGATGTATAAATATCACTGCATTTCGCTCTGTATTCAGTCGCTCTGCGGAGAGGCTGGCAGATTGAGCCCTGGGAGGTTCTCTCCAGCACTAGCAGGTAGAGCCTGGGTGTTCCCTGCTAGACTCTCACCAGCACTTGGCCGGTGCTGGGCAGAGTGACTCCACGCTTGCTTGCTTAAAGCCCTCTTCAATAAAGCTGCCATTTTAGAAGTAAGCTAGTGTGTGTTCCCATCTCTCCTAGCCGCCGCCTGGTCAACTCGGTACTCAATAATAAGAAGACCCTGGTCTGTTAGGACCCTTTCTGCTTTGGGAAACCGAAGCAGGAAAATCCCTAGCA'),
('SIVsmE041-1', 'Virus', 'SIVsmE041-1', 'RNA', 'SIV', 'ACAGGGACTTGAAGGAGAGTGAGAGCTCCTGAGTACGGCTGAGTGAAGGCAGTAAGGGCGGCAGGAACAAACCACGACGGAGTGCTCCTATAAAGGCGCGGGCCGGTACCAGGCGGCGTGAGGAGCGGGAGTCGGAGAGGCCTCCGGTTGCAGGTAAGTGCAACAAAAGAGTCATAGGACTGAGTTCCCTACTTTTGAGGAAAGAGTAGGAGAGTGGGAGATGGGCGCGAGAAACTCCGTCTTGTCAGGGAAAAARGCAGATGAATTAGAAAAAATTAGGTTACGGCCCGGCGGAARGAAAAAGTACATGCTGAAGCATGTAGTRTGGGCAGCAAACGAATTGGACAGATTTGGATTAGCAGAAAGCCTGTTGGAGAACAAAGAAGGTTGTCAAAAAATTCTTTCAGTCTTAGCTCCATTAGTTCCGACAGGTTCAGAAAATTTAAAGAGCCTTTATAATACTGTCTGCGTCATTTGGTGCATTCACGCAGAAGAGAAAGTGAAACATACTGAGGAAGCAAAACAAATAGTGCAGAGACATCTAGTGGTRGAAACAGGAACAGCAGACAAAATGCCAGYAACAAGTAGACCAACAGCACCACCTAGTGGCAGAGGAGGAAATTACCCAGTGCAGCAAGTAGGTGGCAATTATACCCACCTACCYTTAAGTCCAAGAACATTAAATGCTTGGGTAAAATTGATAGAAGAGAAAAAATTTGGGGCAGAAGTAGTGCCAGGATTCCAAGCACTATCAGAAGGCTGCACTCCCTATGACATCAATCAGATGYTAAATTGTGTRGGGGAACATCAATCAGCCATGCAAATTATTAGAGAAATTATAAATGAAGAAGCTGCTGATTGGGATTTACAACACCCRCAGCCAGGYCCAATACCAGCAGGACAACTTAGAGATCCGAGAGGATCAGACATTGCAGGAACTACTAGCACAGTAGAAGAACAAATTCAATGGATGTATAGGCAGCAAAACCCTATACCAGTAGGTAACATTTACAGAAGGTGGATCCAATTAGGGCTGCAAAAATGTGTAAGGATGTATAATCCAACAAACATTTTAGATGTGAAACAAGGACCAAAAGAGCCATTTCAAAGCTATGTAGATAGRTTCTACAAGAGTYTAAGAGCAGAACAAACAGACCCAGCAGTGAAAAATTGGATGACTCAAACACTGCTGATTCAGAATGCTAACCCGGATTGCAAATTGGTGCTCAARGGTCTGGGTATGAATCCCACTTTAGAAGAAATGCTGACAGCCTGTCAGGGAGTAGGAGGACCAGGACAAAAAGCTAGACTAATGGCAGAAGCCTTGAARGAGGCGCTGACGCCAGGGCAACTCCCATTTGCAGCAGTCCAACAGAGAGGACAAAGAAAGACAATTAAATGYTGGAATTGTGGAAAGGAGGGACACTCTGCGAGACARTGCAGAGCCCCTAGAAGACAGGGMTGCTGGAAGTGTGGAAAAACAGGCCATGTTATGGCCAAATGCCCCGARAGACAGGCGGGTTTTTTAGGGCTTGGCCCATGGGGAAAGAAGCCCCGCAATTTCCCCATGGCCCAGATACCTCAGGGGTTGACACCAACTGCTCCCCCAGAGGATCCAGCTGTGGATCTACTGAGGAACTAYATGAAGATGGGCAGAAGGCAGAGGGAGAACAGAGAGAGACCTTACAAGGAGGTGACGGAGGATTTGCTGCACCTCAATTCTCTCTTTGGAGAAGACCAGTAGTTACTGCCYACATTGAAGAACAGCCCRTAGAAGTATTATTAGATACAGGGGCTGATGATTCAATYGTAGCAGGGATAGAATTGGGTCCAAATTATACCCCTAAAATAGTAGGAGGRATAGGAGGTTTCATTAACACCAAGGAATATAAAGATGTAAAAATAAAAGTCTTAGGCAARGTRATTAAGGGAACAATTATGACAGGAGATACCCCAATTAACATTTTTGGCAGAAATCTGCTAACAGCTATGGGCATGTCTCTAAATCTCCCCATAGCTAAGGTRGAACCTATCAAAGTAACACTAAAACCAGGAAAAGATGGACCAAAATTAAGACAGTGGCCRCTATCAAAAGAAAAGATAATTGCATTAAGAGAAATCTGTGAAAAAATGGAAAAAGATGGCCAGTTAGAGGAAGCCCCTCCAACCAATCCATATAACACCCCCACATTTGCTATAAAGAAGAAAGACAAAAATAAATGGAGGATGCTAATAGACTTTAGAGAATTAAACAAGGTTACTCAAGATTTTACAGAAGTACAGTTAGGAATACCACACCCTGCAGGACTAGCAAAGAGAAGAAGGATCACAGTATTGGATGTAGGTGATGCATATTTTTCCATACCTTTAGATGAGGAATTCAGGCAATACACTGCCTTTACTTTACCATCAGTAAACAATGCAGAACCAGGAAAAAGATACATCTATAAGGTATTACCTCAAGGGTGGAAAGGATCACCAGCTATTTTTCAGCATACTATGAGAAATGTCTTAGAACCTTTCAGAAAAGCAAATCCAGATGTGACCCTGATCCAATAYATGGATGACATCCTAATAGCTAGTGATAGAACAGAYTTAGAACATGACAGGGTAGTTTTACAGTTAAAGGAACTTCTAAACAGTATGGGATTTTCCACCCCAGAAGAGAAGTTCCAGAAAGATCCCCCATTCCAGTGGATGGGATATGAATTGTGGCCAACCAAATGGAAACTGCAAAAAATAGAGTTGCCACARARAGAAACCTGGACARTAAATGATATACAAAAATTAGTAGGAGTGCTAAATTGGGCAGCACAAATTTATCCAGGAATAAAGACTAAACACCTTTGCAGATTAATCAGAGGAAAAATGACTTTAACAGAAGAGGTTCAGTGGACTGAGATGGCAGAGGCAGAATATGAAGARAACAAGATAATTCTCAGTCAAGAACAAGAAGGGTGTTAYTATCAAGAGGGAAARCCACTGGAGGCAACAGTAATAAAGAGTCAGGATAATCAATGGTCATATAAAATTCACCAAGAAGACAARATACTAAAAGTAGGCAAATTTGCAAAGATTAAGAATACACATACAAATGGAGTCAGATTATTAGCACATGTAGTACAGAAAATAGGAAAAGAAGCAATAGTAATTTGGGGACAGGTGCCAAAATTTCATYTGCCAGTAGAGAGAGAAATYTGGGAACAATGGTGGACAGATTATTGGCAAGTAACCTGGATACCAGAATGGGACTTTGTATCAACACCTCCCTTAGTCAGATTAGTCTTCAACCTAGTAAAAGAGCCTATACAGGGAGCAGAAACATTTTATGTAGATGGATCCTGTAACAGACAGTCAAAAGAAGGAAAGGCAGGCTATGTGACAGACAGAGGCAGAGACAGAACAAAACCGCTGGAACAGACTACCAATCAACAAGCAGAGYTRGAAGCCTTCCATCTAGCCTTAGCAGATTCAGGACCAAAAGCCAATATAATAGTAGACTCCCAATATGTTATGGGCATAATAGCGGGTCAACCCACTGAATCAGAAAGTAGATTAGTAAATCAGATAATAGAGGAAATGATTAAAAAGGAAGCAATTTATGTAGCGTGGGTACCTGCACATAAAGGAATAGGAGGAAATCAAGAAGTRGATCATCTGGTRAGTCAAGGAATTAGACAAGTCCTATTCTTAGAAAAAATAGAACCAGCGCAAGAAGAGCATGAGAAGTACCATAGCAATGTAAAAGAATTAGTATTCAAATTTGGATTACCTAGGCTAGTAGCAAAACAGATAGTAGACACATGTGATAAATGTCACCAGAAAGGAGARGCCATACATGGACAAGTAAATGCAGAACTAGGGACTTGGCAAATGGACTGTACACACCTAGAGGGCAAAATAATTATAGTTGCAGTACATGTGGCTAGTGGATTCATAGAGGCAGAAGTAATCCCGCAGGAAACAGGAAGACAAACAGCACTGTTTCTGCTAAAATTAGCCAGCAGATGGCCCATCACACATCTGCAYACTGATAATGGTGCCAACTTCACATCGCAAGAAGTGAAAATGGTTGCTTGGTGGGCAGGGATTGAACAGACCTTTGGGGTGCCTTATAATCCACAGAGCCAGGGAGTRGTGGAAGCAATGAACCATCATCTAAAAACCCAGATAGATAGAATYAGGGAACAGGCAAATTCAATAGARACTATAGTACTAATGGCAGTTCATTGCATGAATTTTAAAAGAAGGGGAGGAATAGGGGATATGACTCCAGCAGAAAGATTAGTCAATATGATCACCACAGAACAAGAAATACAATTCCAACAATCAAAAAATTCAAAATTTAAAAATTTTCGGGTCTATTACAGAGAAGGCAGAGACCAGCTGTGGAAAGGACCCGGTGAGCTATTGTGGAAAGGGGAAGGAGCAGTCATCCTAAAGGTAGGGACAGAAATCAAGGTAGTACCAAGGAGGAAAGCTAAAATTATCAAAGACTATGGAGGAGGAAAAGARTTGGATAGCGGTTCCCACTTGGAGGATACCGGGGAGGCTAGAGAAGTGGCATAGCCTCATCAAACACCTGAAATATAACACTAAAGACCTACAGAAGGCTTGTTATGTACCCCATCATAAAGTTGGATGGGCATGGTGGACTTGCAGCAGGGTRATCTTCCCATTAAGGGATGARTCTCATTTGGAAGTACAAGGATATTGGAATTTGACACCAGAGAAAGGATGGCTCAGTACTTATGCAGTGAGAATAACCTGGTACTCCAGRAATTTCTGGACAGATGTAACACCAGATTATGCAGACACTTTACTGCATGGCACTTATTTCCCTTGCTTTTCAGAGGGAGAAGTACGAAGGGCCATCAGGGGAGAGAAATTGCTGTCTTGCTGCAAGTTCCCGAAAGCTCATAAGAATCAGGTACCAAGCCTACAGTATCTAGCACTAACAGTAGTGAGTCATGTCAGATCCCAGGGAGAGGRTCCCACCTGGAAACAGTGGAGAGGAAACRGTAGGCGAGGCCTTCGACTGGCTRGAAAGAACAGTAGAAGAAATAAACAGGGCAGCAGTGAATCATTTGCCGAGGGAGTTAATTTTCCAGGTTTGGCGAAGGTCCTGGGAATACTGGCATGATGAAATAGGGATGTCAGCCAGCTACACAAAATAYAGATACTTGTGCTTGATACAAAAAGCTTTGTTTATGCATTGCAAGAAAGGGTGTAGGTGCTTAGGAGGAGAGCATGGGGCAGGGGGATGGAGACCAGGGCCTCCTCCTCCTCCCCCTCCAGGACTAGCATAAAATGACAGAAAGACCTCCAGAAGATGAAGCCCCACAGAGGGAACCGTGGGATGAATGGGTAGTAGAAGTTCTGGAGGAAGTAAAAGAAGAAGCCCTGAAACATTTTGATCCTCGCTTGCTAACTGCGCTTGGTAACTATATCTATGATAGACATGGAGACACCCTTGAAGGAGCAGGAGAGCTCATTARAATCCTCCAGAGAGCACTCTTCATCCATTTCAGAGGTGGATGCAACCACTCCAGAATCGGCCACTCTGGAGGAGGAAATCCTCTCTCAACTATACCGCCCTCTAGAGGCGTGCTATAACAAGTGCTACTGTAAGAAGTGTTGCTATCATTGTCAGCATTGTTTTCTTAAAAAGGGTTTGGGAATATGCTATGAGCAGCAACGAAGAAGAACTCCGAAGAAGACTAAGGCTAATACATTTTCTGCATCAAACAAGTAAGTATGGGATGTCTTGGGAATCAGCTGCTTATCGCGCTCTTGCTATTAAGTGCTTTAGGGATTTCTTGTGTTCAATATGTRACAGTGTTCTATGGTRTACCAGCATGGAAGAATGCGACARTTCCCCTCTTCTGTGCAACYRAGAATAGGGAYACTTGGGGRACAACACAATGCTTGCCAGATAATGATGATTACTCAGAATTGGCAATTAATGTCACAGAGGCTTTTGATGCTTGGGATAATACAGTCACAGAACAAGCAATAGAGGATGTGTGGAACCTCTTTCAAACATCCATTAAGCCCTGTGTAAAACTTACCCCACTATGTATAGCAATGAGGTGTAATAAAACTGAAACAGATAGATGGGGCTTAACAGGAAAACCAACAACAACAGCATCAACAACAACAAAAACAACATCAAAACCATCAGTAATAACAGCAAARGTTATAAATGAAGGTGATCCATGCATAAAAAATAATAGTTGTGCAGGCTTGGAACARGARCCCATGATAGGTTGTAAATTTAACATGACAGGGTTAAGAAAGGACAAACAGAGAGAATATAATGAAACATGGTATTCAAGAGATATAGTTTGTGAACAAAATAGCAATGAAMATGAAACTGCCAGTAAATGTTATATGAACCATTGTAACACTAGTGTTATTCGAGAATCCTGTGACAAGCATTATTGGGATGCTATTAGATTTAGATATTGTGCTCCGCCAGGTTATGCTTTGCTTAGGTGTAATGATTCAAATTATTCAGGCTTTGAACCTAACTGTACTAAGGTAGTAGTTTCTTCATGCACAAGAATGATGGAAACACAAACCTCTACTTGGTTTGGTTTCAATGGTACTAGAGCAGAAAATAGAACATACATTTATTGGCATGGTAGAAGCAATAGAACCATAATTAGCTTAAATAAGTATTATAATCTAACAATRAGATGTAGGAGACCAGGAAATAAGACAGTCTTACCAGTCACCATTATGTCAGGGTTGGTCTTCCATTCGCAACCCATAAATGAGAGRCCAAAACAGGCCTGGTGCTGGTTTGGAGGAAACTGGAAAGGRGCYATCCGAGAAGTGAAGGAAACCTTGGTCAAACATCCCAGGTATACGGGAACTAATAATACTGAGAAGATTAATCTRACAGCTCCAGCAGGAGGAGATCCGGAAGTTACTTTCATGTGGACAAATTGTCGAGGAGAATTCTTATATTGCAAAATGAATTGGTTTCTYAATTGGGTAGATGAGACAARKGGTTTTAGATGGAATAADCAAAACCCGAAGGAGAAGAAAAGGAGGAATTATGTGCCATGTCATATTAGACAGGTAATYAAYACGTGGCACAGRGTAGGCAAAAATGTGTATTTGCCTCCTAGGGAAGGAGACCTGACATGTAATTCCACTGTAACTAGCCTCATAGCAGAAATAGATTGGATCGATAAAAATGAGACCAATATCACCATGAGTGCAGAGGTGGCAGAGCTGTATCGATTGGAGTTGGGAGATTACAAATTAGTAGARATTACTCCAATTGGCTTGGCCCCCACAAGTGTAAGAAGGTACACCACAACCGGTGCCTCAAGAAATAAAAGAGGGGTCTTTGTGCTAGGGTTCTTGGGTTTTCTCGCAACAGCAGGTTCTGCAATGGGCGCGGCGTCGCTGACGCTGTCCGCTCAGTCCCGGACTTTGTTGGCTGGGATAGTGCAGCAACAGCAACAGCTGTTGGATGTGGTCAAGAGACAACAAGAATTGTTGCGACTGACCGTCTGGGGAACTAARAACCTCCAGACTAGAGTCACTGCTATCGAGAAGTACCTAAAGGATCAGGCRCATCTAAATTCATGGGGATGTGCTTTTAGGCAGGTCTGCCACACTACTGTACCATGGCCAAATGACACATTGRTGCCTAATTGGGAYAATATGACTTGGCAAGAGTGGGAAAGACAGGTTGACTTCCTAGAGGCAAAYATAACTCAATTACTRGAAGAAGCACAAATTCAGCAAGAAAAGAAYATGTATGAGTTGCAAAAATTAAATAGCTGGGATATCTTTGGCAATTGGTTTGACCTTACTTCTTGGATAARATATATACAATATGGTGTACTTATAGTTCTAGGAGTAATAGGATTAAGAATAGTGATATATGTAGTRCARATGTTAGCTAGGTTAAGACAAGGTTATAGGCCAGTGTTCTCTTCCCCTCCCGTTTATGTTCAGCAGATCCCTATCCAGAAGGGCCAGGAACCGCCAACCAAAGAAGGAGAAGAAGGAGACGGTGGAGACAGAGGTGGCAACAGATCTTGGCCTTGGCAGATAGAATAYATTCATTTCCTGATCCGCCAGCTAATACGCCTCTTGAGTTGGCTRTTCAACAGTTGCAGAGWTTGGCTATTGAGGAGCTRCCAGATCCTCCAGCCAGTGCTCCAGAGCCTCTCAAGGATACTGCAGRGAGTCCGTGAAGTCATCAGAGTTGAGATAACCTACCTACAGTATGGGTGGCGTTACTTCCAAGAAGCAGCGCAAGCRTGGTGGAAATTTGCGCGAGAGACTCTTGCAAGCGCGTGGGGAGACTTATGGGAGACTCTGGGACGGGTTGGAAGGAGATTACTCGCAATCCCAAGACGKATCAGGCAGGGGCTTGARCTCACTCTCTTGTGAGCCTCAGAAATATTGTGARGGTCAATTTATGAATACCCCTTGGAGAAACCCAAGAGCAGAAGGAGCAAAATTAGATTATAGACAACAAAACATGGATGATGTGGATGATGATGATRRTGACYTAGTAGGTTTTCCAGTGACCCCAARAGTCCCCTTRAGGACYATGACATACAAATTGGCAATAGACATGTCTCATTTTATAAAAGAAAAGGGGGGACTGGAAGGGATTTATTACAGTGATAGGAGACATAAAATATTGAATCTGTACYTAGAAAAGGAAGAAGGAATAATACCAGATTGGCAAAATTACACAGCAGGGCCAGGAATCAGATACCCTATGTGTTTTGGATGGCTCTGGAAATTAGTCCCAGTAGATGTCTCAGATGAAGCTCAGGAGGACGANNCACATTGCTTGATGCATCCAGCACAGACCTCTCAGTGGGATGACCCCTGGGGAGAGGTACTGGCATGGAAGTTTGATCCAGARTTAGCTTATAACTATAAGGCATTTGTTAAGCACCCAGAAGAGTTTGGTAGTAGYTCAGGCTTGTCAGAGGAAGAGGTAAAGAGAAGGCTAACCGCAAGAGGCCTTTTAAAAATGGCTGACAAGAAGGAAACAAGCTGAGACAGCAGGGACTTTCCACAAAGGGGATGTTATGGGGAGGTACTGGGGAGGAGCTGGCTGGAACGCCCACTTATTC'),
('SIVmac239cy0163', 'Virus', 'SIVmac239cy0163', 'RNA', 'SIV', 'NNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNCCAGGAAGGGGTAATAAGATAGAGTGGGAGATGGGCGCGAGAAACTCCGTCTTGTCAGGGAAGAAAGCAGATGAATTAGAAAAAATTAGGCTACGACCCAACGGAAAGAAAAAGTACATGTTGAAGCATGTAGTATGGGCAGCAAATGAATTAGATAGATTTGGATTAGCAGAAAGCCTGTTGGAGAACAAAGAAGGATGTCGAAAAATACTTTCGGTCTTAGCTCCATTAATGCCAACAGGCTCAGAAAATTTAAAAAGCCTTTATAATACTGTCTGCGTCATCTGGTGCATTCACGCAGAAGAGAAAGTGAAACACACTGAGGAAGCAAAACAGATAGTGCAGAGACACCTAGTGGTGGAAACAGGAACAACAGAAACTATGCCAAAAACAAGTAGACCAACAGCACCATCTAGCGGCAGAGGAGGAAATTACCCAGTACAACAAATAGGTGGTAACTATGTCCACCTGCCATTAAGCCCGAGAACATTAAATGCCTGGGTAAAATTGATAGAGGAAAAGAAATTTGGAGCAGAAGTAGTGCCAGGATTTCAGGCACTGTCAGAAGGTTGCACCCCCTATGACATTAATCAGATGTTAAATTGTGTGGGAGACCATCAAGCGGCTATGCAGATTATCAGAGATATTATAAACGAGGAGGCTGCAGATTGGGACTTGCAGCACCCACAACCAGCTCCACAACAAGGACAACTTAGGGAGCCGTCAGGATCAGATATTGCAGGAACAACTAGTTCAGTAGATGAACAAATCCAGTGGATGTACAGACAACAGAACCCCATACCAGTAGGCAACATTTACAGGAGATGGATCCAACTGGGGTTGCAAAAATGTGTCAGAATGTATAACCCAACAAACATTCTAGATGTAAAACAAGGGCCAAAAGAGCCATTTCAGAGCTATGTAGACAGGTTCTACAAAAGTTTAAGAGCAGAACAGACAGATGCAGCAGTAAAGAATTGGATGACTCAAACACTGCTGATTCAAAATGCTAACCCAGATTGCAAGCTAGTGCTGAAGGGGCTGGGTGTGAATCCCACCCTAGAAGAAATGCTGACGGCTTGTCAAGGAGTAGGGGGGCCGGGACAGAAGGCTAGATTAATGGCAGAAGCCCTGAAAGAGGCCCTCGCACCAGTGCCAATCCCTTTTGCAGCAGCCCAACAGAGGGGATCAAGAAAGCCAATTAAGTGTTGGAATTGTGGGAAAGAGGGACACTCTGCAAGGCAATGCAGAGCCCCAAGAAGACAGGGATGCTGGAAATGTGGAAAAATGGACCATGTTATGGCCAAATGCCCAGACAGACAGGCGGGTTTTTTAGGCCTTGGTCCATGGGGAAAGAAGCCCCGCAATTTCCCCATGGCTCAAGTGCATCAGGGGCTGATGCCAACTGCTCCCCCAGAGGACCCAGCTGTGGATCTGCTAAAGAGCTACATGCAGTTGGGCAAGCAGCAGAGAGAAAAGCAGAGAGAAAGCAGAGAGAAGCCTTACAAGGAGGTGACAGAGGATTTGCTGCACCTCAATTCTCTCTTTGGAGGAGACCAGTAGTCACTGCTCATATTGAAGAACAGCCTGTAGAAGTATTACTGGATACAGGGGCTGATGATTCTATTGTAACAGGAATAGAGTTAGGTCCACATTATACCCCAAAAATAGTAGGAGGAATAGGAGGTTTTATTAATACTAAAGAATACAAAAATGTAGAAATAGAAGTTTTAGGCAAAAGGATTAAAGGGACAATCATGACAGGGGACACCCCGATTAACATTTTTGGTAGAAATTTGCTAACAGCTCTGGGGATGTCTCTAAATTTTCCCATAGCTAAAGTAGAGCCTGTAAAAGTCGCCTTAAAGCCAGGAAAGGATGGACCAAAATTGAAGCAGTGGCCATTATCAAAAGAAAAGATAGTTGCATTAAGAGAAATCTGTGAAAAGATGGAAAAGGATGGTCAGTTGGAGGAAGCTCCCCCGACCAATCCATACAACACCCCCACATTTGCTATAAAGAAAAAGGATAAGAACAAATGGAGAATGCTGATAGATTTTAGGGAACTAAATAGGGTCACTCAGGACTTTACGGAAGTCCAATTAGGAATACCACACCCTGCAGGACTAGCAAAAAGGAAAAGAATTACAGTACTGGATATAGGTGATGCATATTTCTCCATACCTCTAGATGAAGAATTTAGGCAGTACACTGCCTTTACTTTACCATCAGTAAATAATGCAGAGCCAGGAAAACGATACATTTATAAGGTTCTGCCTCAGGGATGGAAGGGGTCACCAGCCATCTTCCAATACACTATGAGACATGTGCTAGAACCCTTCAGGAAGGCAAATCCAGATGTGACCTTAGTCCAGTATATGGATGACATCTTAATAGCTAGTGACAGGACAGACCTGGAACATGACAGGGTAGTTTTACAGTTAAAGGAACTCTTGAATAGCATAGGGTTTTCTACCCCAGAAGAGAAATTCCAAAAAGATCCCCCATTTCAATGGATGGGGTACGAATTGTGGCCAACAAAATGGAAGTTGCAAAAGATAGAGTTGCCACAAAGAGAGACCTGGACAGTGAATGATATACAGAAGTTAGTAGGAGTATTAAATTGGGCAGCTCAAATTTATCCAGGTATAAAAACCAAACATCTCTGTAGGTTAATTAGAGGAAAAATGACTCTAACAGAGGAAGTTCAGTGGACTGAGATGGCAGAAGCAGAATATGAGGAAAATAAAATAATTCTCAGTCAGGAACAAGAAGGATGTTATTACCAAGAAGGCAAGCCATTAGAAGCCACGGTAATAAAGAGTCAGGACAATCAGTGGTCTTATAAAATTCACCAAGAAGACAAAATACTGAAAGTAGGAAAATTTGCAAAGATAAAGAATACACATACCAATGGAGTGAGACTATTAGCACATGTAATACAGAAAATAGGAAAGGAAGCAATAGTGATCTGGGGACAGATCCCAAAATTCCACTTACCAGTTGAGAAGGATGTATGGGAACAGTGGTGGACAGACTATTGGCAGGTAACCTGGATACCGGAATGGGATTTTATCTCAACACCACCGCTAGTAAGATTAGTCTTCAATCTAGTGAAGGACCCTATAGAGGGAGAAGAAACCTATTATACAGATGGATCATGTAATAAACAGTCAAAAGAAGGGAAAGCAGGATATATCACAGATAGGGGCAAAGACAAAGTAAAAGTGTTAGAACAGACTACTAATCAACAAGCAGAATTGGAAGCATTTCTCATGGCATTGACAGACTCAGGGCCAAAGGCAAATATTATAGTAGATTCACAATATGTTATGGGAATAATAACAGGATGCCCTACAGAATCAGAGAGCAGGCTAGTTAATCAAATAATAGAAGAAATGATTAAAAAGTCAGAAATTTATGTAGCATGGGTACCAGCACACAAAGGTATAGGAGGAAACCAAGAAATAGACCACCTAGTTAGTCAAGGGATTAGACAAGTTCTCTTCTTGGAAAAGATAGAGCCAGCACAAGAAGAACATGATAAATACCATAGTAATGTAAAAGAATTGGTATTCAAATTTGGATTACCCAGAATAGTGGCCAGACAGATAGTAGACACCTGTGATAAATGTCATCAGAAAGGAGAGGCTATACATGGGCAGACAAATTCAGATCTAGGGACTTGGCAAATGGATTGTACCCATCTAGAGGGAAAAATAATCATAGTTGCAGTACATGTAGCTAGTGGATTCATAGAAGCAGAGGTAATTCCACAAGAGACAGGAAGACAGACAGCACTATTTCTGTTAAAATTGGCAGGCAGATGGCCTATTACACATCTACACACAGATAATGGTGCTAACTTTGCTTCGCAAGAAGTAAAGATGGTTGCATGGTGGGCAGGGATAGAGCACACCTTTGGGATACCATACAATCCACAGAGTCAGGGAGTAGTGGAAGCAATGAATCACCACCTGAAAAATCAAATAGATAGAATCAGGGAACAAGCAAATTCAGTAGAAACCATAGTATTAATGGCAGTTCATTGCATGAATTTTAAAAGAAGGGGAGGAATAGGGGATATGACTCCAGCAGAAAGATTAATTAACATGATCACTACAGAACAAGAGATACAATTTCAACAATCAAAAAACTCAAAATTTAAAAATTTTCGGGTCTATTACAGAGAAGGCAGAGATCAACTGTGGAAGGGACCCGGTGAGCTATTGTGGAAAGGGGAAGGAGCAGTCATCTTAAAGGTAGGGACAGACATTAAGGTAGTACCCAGAAGAAAGGCTAAAATTATCAAAGATTATGGAGGAGGAAAAGAGGTGGATAGCAGTTCCCACATGGAGGATACCGGAGAGGCTAGAGAGGTGGCATAGCCTCATAAAATATCTGAAATATAAAACTAAAGATCTACAAAAGGTTTGCTATGTGCCCCATTTTAAGGTCGGATGGGCATGGTGGACCTGCAGCAGAGTAATCTTCCCACTACAGGAAGGAAGCCATTTAGAAGTACAAGGGTATTGGAATTTGACACCAGAAAAAGGGTGGCTCAGTACTTATGCAGTGAGGATAACCTGGTACTCAAAGAACTTTTGGACAGATGTAACACCAAACTATGCAGACATTTTACTGCATAGCACTTATTTCCCTTGCTTTACAGCGGGAGAAGTGAGAAGGGCCATCAGGGGAGAACAACTGCTGTCTTGCTGCAGGTTCCCGAGAGCTCATAAGTACCAGGTACCAAGCCTACAGTACTTAGCACTGAAAGTAGTAAGCGATGTCAGATCCCAGGGAGAGAATCCCACCTGGAAACAGTGGAGAAGAGACAATAGGAGAGGCCTTCGAATGGCTAAACAGAACAGTAGAGGAGATAAACAGAGAGGCGGTAAACCACCTACCAAGGGAGCTGATTTTCCAGGTTTGGCAAAGGTCTTGGGAATACTGGCATGATGAACAAGGGATGTCACCAAGCTATGTAAAATACAGATACTTGTGTTTAATACAAAAGGCTTTATTTATGCATTGCAAGAAAGGCTGTAGATGTCTAGGGGAAGGACATGGGGCAGGGGGATGGAGACCAGGACCTCCTCCTCCTCCCCCTCCAGGACTAGCATAAATGGAAGAAAGACCTCCAGAAAATGAAGGACCACAAAGGGAACCATGGGATGAATGGGTAGTGGAGGTTCTGGAAGAACTGAAAGAAGAAGCTTTAAAACATTTTGATCCTCGCTTGCTAACTGCACTTGGTAATCATATCTATAATAGACATGGAGACACCCTTGAGGGAGCAGGAGAACTCATTAGAATCCTCCAACGAGCGCTCTTCATGCATTTCAGAGGCGGATGCATCCACTCCAGAATCGGCCAACCTGGGGGAGGAAATCCTCTCTCAGCTATACCGCCCTCTAGAAGCATGCTATAACACATGCTATTGTAAAAAGTGTTGCTACCATTGCCAGTTTTGTTTTCTTAAAAAAGGCTTGGGGATATGTTATGAGCAATCACGAAAGAGAAGAAGAACTCCGAAAAAGGCTAAGGCTAATACATCTTCTGCATCAAACAAGTAAGTATGGGATGTCTTGGGAATCAGCTGCTTATCGCCATCTTGCTTTTAAGTGTCTATGGGATCTATGGCACTCTATATGTCACAGTCTTTTATGGTGTACCAGCTTGGAGGAATGCGACAATTCCCCTCTTTTGTGCAACCAAGAATAGGGATACTTGGGGAACAACTCAGTGCCTACCAGATAATGGTGATTATTCAGAAATGGCCCTTAATGTTACAGAAAGCTTTGATGCCTGGAATAATACAGTCACAGAACAGGCAATAGAGGATGTATGGCAACTCTTTGAGACCTCAATAAAGCCTTGTGTAAAATTATCCCCATTATGCATTACTATGAGATGCAATAAAAGTGAGACAGATAGATGGGGATTGACAAAATCAATAACAACAACAGCATCAACAACATCAACGACAGCATCAGCAAAAGTAGACATGGTCAATGAGACTAGTTCTTGTATAGCCCAGGATAATTGCACAGGCTTGGAACAAGAGCAAATGATAAGCTGTAAATTCAACATGACAGGGTTAAAAAGAGACAAGAAAAAAGAGTACAATGAAACTTGGTACTCTGCAGATTTGGTATGTGAACAAGGGAATAACACTGGTAATGAAAGTAGATGTTACATGAACCACTGTAACACTTCTGTTATCCAAGAGTCTTGTGACAAACATTATTGGGATGCTATTAGATTTAGGTATTGTGCACCTCCAGGTTATGCTTTGCTTAGATGTAATGACACAAATTATTCAGGCTTTATGCCTAATTGTTCTAAGGTGGTGGTCTCTTCATGCACAAGGATGATGGAGACACAGACTTCTACTTGGTTTGGCTTTAATGGAACTAGAGCAGAAAATAGAACTTATATTTACTGGCATGGTAGGGATAATAGGACTATAATTAGTTTAAATAAGTATTATAATCTAACAATGAAATGTAGAAGACCAGGAAATAAGACAGTTTTACCAGTCACCATTATGTCTGGATTGGTTTTCCACTCACAACCAATCAATGATAGGCCAAAGCAGGCATGGTGTTGGTTTGGAGGAAAATGGAAGGATGCAATAAAAGAGGTGAAGCAGACCATTGTCAAACATCCCAGGTATACTGGAACTAACAATACTGATAAAATCAATTTGACGGCTCCTGGAGGAGGAGATCCGGAAGTTACCTTCATGTGGACAAATTGCAGAGGAGAGTTCCTCTACTGTAAAATGAATTGGTTTCTAAATTGGGTAGAAGATAGGAATACAGCTAACCAGACGTCAAAGGAACAGCATAAAAGAAATTACGTGCCATGTCATATTAGACAAATAATCAACACTTGGCATAAAGTAGGCAGAAATGTTTATTTGCCTCCAAGAGAGGGAGACCTCACGTGTAACTCCACAGTGACCAGTCTCATAGCAAACATAGATTGGATTGATGGAAACCAAACTAATATCACCATGAGTGCAGAGGTGGCAGAACTGTATCGATTGGAATTGGGAGATTATAAATTAGTAGAGATCACTCCAATTGGCTTGGCCCCCACAAATGTGAAGAGGTACACTACTGGTGGCACCTCAAGAAATAAAAGAGGGGTCTTTGTGCTAGGGTTCTTGGGTTTTCTCGCAACGGCAGGTTCTGCAATGGGCGCGGCGTCGTTGACGCTGACCGCTCAGTCCCGAACTTTATTGGCTGGGATAGTGCAGCAACAGCAACAGCTGTTGGACGTGGTCAAGAGACAACAAGAATTGTTGCGACTGACCGTCTGGGGAACAAAGAACCTCCAGACTAGGGTCACTGCCATCGAGAAGTACTTAAAGGACCAGGCGCAGCTGAATGCTTGGGGATGTGCGTTTAGACAAGTCTGCCACACTACTGTACCATGGCCAAATGCAAGTCTAACACCAGAGTGGAACAATGAGACTTGGCAAGAGTGGGAGCGAAAGGTTGACTTCTTGGAGGAAAATATAACAGCCCTCCTAGAGGAGGCACAAATTCAACAAGAGAGGAACATGTATGAATTACAAAAGTTGAATAGCTGGGATGTGTTTGGCAATTGGTTTGACCTTGCTTCTTGGATAAAGTATATACAATATGGAGTTTATATAGTTGTAGGAGTAATACTGTTAAGAATAGTGATCTATATAGTACAAATGCTAGCTAAGTTAAGGCAGGGGTATAGGCCAGTGTTCTCTTCCCCACCCTCTTATTTCCAGCAGACCCATATCCAACAGGACCCGGCACTGCCAACCAGAGAAGGCAAAGAAGGAGACGGTGGAGAAGGCGGTGGCAACAGCTCCTGGCCTTGGCAGATAGAATATATTCATTTCCTGGTCCGTCAACTGATACGCCTCTTGACTTGGCTATTCAGCAACTGCAGAACCTTGCTATCGAGAGTATACCAGGTCCTCCAACCAATACTCCAGAGGCTCTCTGCGACCCTACAGAGGATTCGAGAAGTCCTCAGGACTGAACTGACCTACCTACAATATGGGTGGAGCTATTTCCATGAGGCGGTCCAGGCCGTCTGGAGATCTGCGACAGAGACTCTTGCGGGCGCGTGGGGAGACTTATGGGAGACTCTTAGGAGAGGTGGAAGATGGATACTCGCAATCCCCAGGAGGATTAGACAAGGGCTTGAGCTCACTCTCTTGTGAGGGACAGAAATACAATCAGGGACAGTATATGAATACTCCATGGAGAAACCCAGCTGAAGAGAGAGAAAAATTAGCATACAGAAAACAAAATATGGATGATATAGATGAGGAAGATGATGACTTGGTAGGGGTATCAGTGAGGTCAAAAGTTCCCCTAAGAACAATGAGTTACAAATTGGCAATAGACATGTCTCATTTTATAAAAGAAAAGGGGGGACTGGAAGGGATTTATTACAGTGCAAGAAGACATAGAATCTTAGACATATACTTAGAAAAGGAAGAAGGCATCATACCAGATTGGCAGGATTACACCTCAGGACCAGGAATTAGATACCCAAAGACATTTGGCTGGCTATGGAAATTAGTCCCTGTAAATGTATCAGATGAGGCACAGGAGGATGAGGAGCATTATTTAATGCATCCAGCTCAAACTTCCCAGTGGGATGACCCTTGGGGAGAGGTTCTAGCATGGAAGTTTGATCCAACTCTGGCCTACACTTATGAGGCATATGTTAGATACCCAGAAGAGTTTGGAAGCAAGTCAGGCCTGTCAGAGGAAGAGGTTAGAAGAAGGCTAACCGCAAGAGGCCTTCTTAACATGGCTGACAAGAAGGAAACTCGCTGAAACAGCAGGGACTTTCCACAAGGGGATGTTACGGGGAGGTACTGGGGAGGAGCCGGTCGGGAACGCCCACTTTCTTGATGTATAAATATCACTGCATTTCGCTCTGNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNN'),
('SIVsmE543', 'Virus', 'SIVsmE543', 'RNA', 'SIV', 'TGGAAGGGATTTATTACAATGAGAAAAGACATAGAATATTAGATATGTACATGGAAAAGGAAGAAGGAATAATACCAGATTGGCAAAATTACACATTAGGGCCAGGAACTAGATACCCTATGTACTTTGGGTGGCTCTGGAAATTAGTCCCAGTAGATGTCTCAGATGAAGCCCAGGAAGACGAGACACATTGCCTGGTGCATCCAGCACAGACTCATCAGTGGGATGACCCCTGGGGAGAGGTACTGGCATGGAAGTTTGATCCAGAATTGGCTTATAGCTATAAGGCATTTATTAAGTACCCAGAAGAGTTTGGTAGTAAGTCAGGCTTGTCAGAGGAAGAGGTAAAGAGAAGGCTAACCGCAAGAGGCATTTATAAAATGGCTGACAAGAGGGAAACAAGCTGAGACAGCAGGGACTTTCCACAAGGGACTTTCCACAAGGGGCTGTCATGGGGAGGTACTGGGGAGGAGCTGGCTGGAACGCCCACTTATTCTCTGTATAAATACAACTGCATTTCGCTCTGTAGTCAGTCGCTCTGCGGAGAGGCTGGCAGATTGAGCCCTGGGAGGTTCTCTCCAGCACTAGCAGGTAGAGCCTGGGTGTTCCCTGCTAGACTCTCACCAGCACTTGGCCGGTGCTGGGCAGAGTGGCTCCACGCTTGCTTGCTTAAAGACCTCTTCAATAAAGCTGCCATTTAGAAGTAAGCAAGTGTGTGTTCCCATCTCTCCTAGTCGCCGCCTGGTCATCTCGGTACTCGACACATAAAGAAGACCCTGGTCTGTTAGGACCCTTTCTGCTTTGGGAAACCGAGGCAGGAAAATCCCTAGCAGGTTGGCGCCCGAACAGGGACTTGAAGGAGGTGAGAGCTCCTGAGTACGGCTGAGTGAAGGCAGTAAGGGCGGCAGGAACAAACCACGACGGAGAGCTCCTAGAAAGGCGCGGGCCGGTACCAGGCGGCGTGAGGAGCAGGGAGTCGGAGAGGCCTCCGGTTGCAGGTAAGTGCAACAAAAAGTCATAGGACTGAGTTCCCTACTTTTGAGGAAAGAGTAGGAGAGTGGGAGATGGGCGCGAGAAACTCCGTCTTGTCAGGGAAGAAAGCAGATGAATTAGAAAAAATTAGGTTACGGCCCAACGGAAAGAAAAAGTATATGTTGAAGCATGTAGTATGGGCAGCAAATGAATTGGATAGATTTGGATTAGCAGAAAGCCTGTTGGATAACAAAGAAGGTTGTCAAAAAATTCTTTCGGTTTTAGCTCCATTAGTTCCGACAGGTTCAGAAAATTTAAAGAGCCTTTATAATACTGTCTGCGTCATTTGGTGCATTCACGCAGAAGAGAAAGTGAAACATACTGAGGAAGCAAAACAAATAGTGCAGAGACATCTAGTGGTGGAAACAGGAACAGCAGACAAAATGCCAGCAACAAGCAGACCAACAGCACCACCTAGTGGCAGAGGAGGAAATTACCCAGTGCAGCAAGTAGGTGGCAATTATGTCCACCTACCCTTAAGTCCAAGAACATTAAATGCTTGGGTAAAATTGGTAGAAGAGAAAAAATTTGGGGCAGAGGTAGTGCCAGGATTTCAAGCGCTATCAGAAGGCTGCACTCCCTATGACATCAATCAAATGCTAAATTGTGTAGGAGAACATCAGGCAGCCATGCAAATTATTAGAGAGATTATAAATGAAGAAGCTGCCGATTGGGATTTACAACACCCGCAGCCAGGTCCACTACCAGCAGGGCAACTTAGAGAGCCAAGAGGATCAGACATTGCAGGAACTACTAGTACAGTAGAGGAACAAATCCAATGGATGTACAGGCAACAAAACCCCATACCAGTAGGCAACATTTATAGGAGGTGGATCCAATTAGGGCTGCAGAAATGTGTAAGAATGTATAACCCAACAAACATTTTAGATGTGAAACAAGGACCAAAAGAGCCATTTCAAAGCTACGTAGATAGATTCTACAAAAGTCTAAGAGCAGAGCAAACAGACCCGGCAGTAAAGAATTGGATGACCCAAACACTGCTGATTCAAAATGCTAACCCAGATTGTAAATTGGTGCTCAAGGGTCTGGGTATGAATCCCACTTTAGAAGAAATGCTGACAGCCTGTCAGGGAATAGGAGGGCCAGGACAAAAAGCTAGATTAATGGCAGAAGCATTGAAAGAGGCACTGAGACCAGACCAACTCCCATTTGCAGCAGTCCAACAGAAAGGACAAAGGAGGACAATCAAGTGTTGGAATTGTGGAAAGGAGGGACACTCTGCAAGACAATGCAGGGCCCCTAGAAGACAGGGCTGCTGGGGGTGCGGAAAAACGGGTCATGTTATGGCCAAATGCCCTGAAAGACAGGCGGGTTTTTTAGGGTTTGGCCCATGGGGAAAGAAGCCCCGCAATTTCCCCATGGCCCAGATGCCTCAGGGGCTGACACCAACTGCTCCCCCAGAGGATCCAGCTGTGGATCTACTGAAGAATTACATGAAGATGGGCAGAAAGCAGAGGGAGAACAGAGAGAGACCTTACAAGGAGGTGACAGAGGATTTGCTGCACCTCAATTCTCTCTTTGGAGAAGACCAGTAGTCACTGCCTACATTGAAGAACAGCCCGTAGAAGTATTATTAGATACAGGGGCTGATGATTCAATTGTAACAGGGATAGAATTGGGTCCAAATTATACCCCTAAAATAGTAGGAGGAATAGGAGGCTTCATTAATACCAAAGAATATAAAGATGTGAAAATAAAAGTCTTAGGCAAGGTAATTAAGGGAACAATTATGACGGGAGATACCCCAATTAATATTTTTGGCAGAAATTTGCTAACAGCTATGGGCATGTCTTTAAATTTCCCCATAGCTAAGGTGGAGCCTATAAAAGTAACACTAAAACCAGGGAAAGAAGGACCAAAATTGAGACAGTGGCCGCTATCAAAAGAAAAGATAATTGCATTAAGAGAAATCTGTGAAAAAATGGAAAAAGATGGCCAGTTAGAGGAAGCCCCTCCAACCAATCCGTATAACACCCCCACTTTTGCTATAAAGAAGAAAGACAAAAATAAATGGAGAATGCTAATAGATTTTAGAGAATTAAATAAGGTCACTCAAGACTTTACAGAAGTACAGTTAGGAATACCACACCCTGCAGGACTAGCAAAGAGAAGGAGGATCACAGTATTGGATGTAGGTGATGCATATTTCTCCATTCCTCTAGATGAAGAATTCAGGCAGTACACTGCCTTTACTTTACCATCAGTAAATAATGCAGAACCAGGAAAAAGATACATCTATAAGGTATTACCTCAAGGGTGGAAGGGGTCACCAGCTATTTTTCAGTATACTATGAGAAATGTATTAGAACCTTTCAGAAAAGCAAATCCAGATGTGACCCTGATCCAATACATGGATGACATCTTAATAGCTAGTGATAGAACAGATTTAGAGCATGACAGGGTAGTTTTACAGTTAAAGGAACTTCTGAACGGCATAGGATTCTCCACCCCAGAAGAGAAGTTCCAGAAAGATCCCCCATTCCAGTGGATGGGATATGAATTGTGGCCAACCAAATGGAAACTGCAGAAAATAGAGTTGCCACAAAGAGAGACCTGGACAGTAAATGACATACAAAAATTAGTAGGAGTGCTAAATTGGGCAGCACAAATTTATCCAGGAATAAAGACTAAACATCTTTGCAGACTAATCAGAGGAAAAATGACTTTAACAGAAGAGGTTCAGTGGACTGAGATGGCAGAGGCAGAATATGAAGAAAACAAGATAATTCTCAGTCAAGAACAAGAAGGATGTTACTACCAAGAGGGAAAACCAATAGAGGCAACAGTAATAAAGAGTCAGGATAATCAGTGGTCATATAAAATTCACCAAGAAGACAAAGTACTAAAAGTGGGCAAATTTGCAAAGGTTAAAAATACACATACAAATGGAGTCAGATTACTAGCACATGTAGTGCAGAAAATAGGAAAGGAGGCACTAGTAATTTGGGGAGAGGTGCCAAAATTCCATTTGCCAGTAGAAAGAGAAATTTGGGAACAATGGTGGACAGATTATTGGCAAGTAACCTGGATACCAGATTGGGACTTTGTGTCAACACCTCCCTTAGTCAGATTAGTCTTCAACCTAGTAAAAGAGCCTATACAGGGAGCAGAAACATTTTACGTAGATGGATCCTGTAATAGGCAGTCAAGAGAAGGAAAAGCAGGCTATGTGACGGATAGGGGCAGAGACAAAGCAAAACTTTTAGAACAGACTACCAACCAACAAGCAGAGTTGGAAGCCTTCTATCTAGCCTTAGCAGATTCGGGACCAAAAGCAAATATTATAGTAGATTCCCAATATGTTATGGGCATAGTAGCAGGTCAGCCCACTGAATCAGAAAGTAGGTTAGTAAACCAGATAATAGAAGAGATGATTAAAAAGGAAGCAATTTATGTAGCATGGGTACCTGCACATAAAGGAATAGGAGGAAATCAAGAAGTAGATCACCTGGTTAGCCAGGGAATTAGACAAGTCCTATTCTTAGAAAAAATAGAACCAGCACAAGAAGAGCATGAAAAGTACCATAGCAATGTAAAAGAATTGGTATTCAAATTTGGTATACCTAGGCTAGTAGCAAAACAGATAGTAGACACATGTGATAGATGCCACCAGAAAGGAGAAGCCATACATGGGCAAGTAAATGCAGAACTAGGGACTTGGCAAATGGACTGTACGCACCTAGAAGGCAAAATAATTATAGTTGCAGTACATGTGGCTAGTGGATTTATAGAGGCAGAAGTAATCCCGCAGGAAACAGGAAGACAAACAGCACTGTTTCTGTTAAAGCTAGCTGGCAGATGGCCCATCACACATCTGCATACTGATAATGGTGCCAATTTCACATCACAAGAAGTGAAAATGGTTGCCTGGTGGGCAGGGATTGAACAGACCTTTGGAGTGCCTTATAATCCACAGAGCCAAGGAGTAGTGGAAGCAATGAACCATCATTTAAAAACCCAGATAGATAGAATTAGAGAACAAGCAAACTCAGTAGAGACTATAGTACTAATGGCAGTTCATTGCATGAATTTTAAAAGAAGGGGAGGAATAGGGGATATGACTCCAGCAGAAAGATTAGTCAATATGATCACCACAGAACAAGAAATACAATTCCAACAATCAAAAAATTCAAAATTTAAAAATTTTCGGGTCTATTACAGAGAAGGCAGAGACCAGCTGTGGAGAGGACCCGGTGAGCTATTGTGGAAAGGGGAAGGAGCAGTCATCCTAAAGGTAGGGACAGAGATTAAGGTAGTACCAAGGAGGAAAGCTAAAATTATCAAAGACTATGGAGGAGGAAAAGAATTGGATAGTGGTTCCCACTTGGAGGATACCGGAGAGGCTAGAGAGGTGGCATAGCCTCATCAAACACCTGAAATATAACACTAAGGACCTACAGATGGCTTGCTATGTGCCCCATCATAAAGTTGGATGGGCATGGTGGACTTGCAGCAGAGTAATTTTCCCATTAAGGGATAAGACTCATTTGGAAGTACAAGGATATTGGAATTTGACACCAGAAAAAGGATGGCTCAGTACTCATGCAGTAAGAATAACCTGGTACTCCAGAAATTTCTGGACAGATGTAACACCAGATTGTGCAGACACTTTACTGCATAGCACTTATTTCCCTTGCTTTTCAGAGGGAGAAGTACAAAGAGCCATCAGGGGAGAGAAATTGCTGTCTTGCTGCAAGTTCCCGAAAGCTCATAAAAATCAGGTACCAAGCCTACAGTATCTAGCACTAACAGTAGTAAGTCATGTCAGATCCCAGAGAGAGGATCCCACCTGGAAACAGTGGAGAGGAAACAATAGAAGAGGCCTTCGAATGGCTAAACAGAACAGTAGAAGGAATAAACAGGGCAGCAGTAAATCACCTGCCGAGGGAGCTAATTTTCCAGGTTTGGCAAAGGTCCTGGGAATACTGGCATGATGAAATGGGAATGTCAGAAAGCTACACAAAATATAGATACTTGTGCTTGATACAGAAAGCTCTGTTTATGCATTGCAAGAAAGGGTGTAGGTGCTTAGGAGAAGGGCATGGGGCAGGGGGATGGAGAACAGGGCCTCCTCCTCCTCCCCCTCCAGGACTAGCATAAAATGGCAGAAAGACCTCCAGAAGATGAAGCCCCACAGAGGGAACCATGGGATGAATGGGTAGTGGAAGTTCTGGAGGAAATAAAAGAAGAAGCCCTGAAACATTTTGATCCTCGCTTGCTAACTGCGCTTGGTAACTATATTTATGATAGACATGGAGACACCCTTGAAGGAGCAGGAGAACTCATTAGAATCCTACAGAGAGCACTCTTCATCCATTTCAGAAGTGGATGTGCCCACTCCAGAATCGGCCAATCTAGAGGAGGAAATCCTCTCTCAACTATACCGCCCTCTAGAGCCATGCTATAACAAGTGCTACTGTAAGAGGTGTTGCTATCATTGTCAGCATTGTTTTCTTAAAAAGGGTTTGGGAATATGCTATGAGCAGCACCGAAGAAGAACTCCGAAAAAGACTAAGACTAATCCACTTCCTGCATCAAACAAGTAAGTATGGGATGTCTTGGGAATCAGCTGCTTATCGCGCTCTTGCTAGTAAGTGTTTTAGAGATTTGTTGTGTTCAATATGTAACAGTATTCTATGGTGTACCAGCATGGAAGAATGCGACAATTCCCCTCTTCTGTGCAACCAGGAATAGGGACACTTGGGGAACAACACAATGCTTGCCTGATAATGATGATTACTCAGAATTGGCAGTCAATATCACAGAGGCTTTTGATGCTTGGAATAATACAGTCACAGAACAAGCAATAGAGGATGTGTGGAACCTCTTTGAAACATCCATTAAGCCCTGTGTAAAACTTACCCCACTATGTATAGCAATGAGATGTAATAAAACTGAGACAGATAGGTGGGGTTTGACAGGAAGAGCAGAGACAACAACAACAGCGAAATCAACAACATCAACAACAACAACAACAGTAACACCAAAGGTTATAAATGAAGGTGATTCTTGCATAAAAAATAATAGTTGTGCAGGCTTGGAACAGGAGCCCATGATAGGTTGTAAATTTAACATGACAGGGTTAAAGAGGGACAAAAAGATAGAATATAATGAAACATGGTATTCAAGAGATTTAATCTGTGAGCAGCCAGCAAATGGAAGTGAGAGTAAATGTTACATGCAGCATTGTAACACCAGTGTTATTCAGGAATCCTGTGACAAGCATTATTGGGATGCTATTAGATTTAGATACTGTGCACCGCCAGGTTATGCTTTGCTTAGGTGTAATGATTCAAATTATTCAGGCTTTGCTCCTAAATGTTCTAAGGTAGTGGTTTCTTCATGCACAAGAATGATGGAGACGCAAACCTCTACTTGGTTTGGCTTCAATGGTACTAGGGCAGAAAATAGAACATACATTTATTGGCATGGCAATAGTAATAGAACCATAATTAGCTTAAATAAGTATTATAATCTAACAATGAAATGTAGAAGACCAGGAAATAAGACAGTTTTACCAGTCACCATTATGTCAGGGTTGGTCTTCCATTCGCAACCCATAAATGAGAGACCAAAACAGGCCTGGTGCCGGTTTGGAGGAAACTGGAGCGAGGCCATCCAGGAAGTGAAGGAAACCTTGGTCAAACATCCCAGGTATACGGGAACTAATGATACTAGGAAAATTAATCTAACAGCTCCAGCAGGAGGAGATCCAGAAGTCACTTTTATGTGGACAAATTGTCGAGGAGAATTCTTATACTGCAAAATGAATTGGTTTCTCAATTGGGTAGAGGACAGAGACCAAAATAGTAACAGATGGAAACAACAAAAGAAGCCAGAGCAACAGAAGAGAAATTATGTGCCATGTCATATTAGACAAATAATCAACACGTGGCACAAAGTAGGCAAAAATGTATATTTGCCTCCTAGGGAAGGAGACCTGACATGTAATTCCACTGTAACTAGTCTCATAGCAGAGATAGATTGGATCAATAACAATGAGACCAATATCACCATGAGTGCAGAGGTGGCAGAACTGTATCGATTGGAGTTGGGAGATTACAAATTAGTAGAGATTACTCCAATTGGCTTGGCCCCCACAGATGTAAGAAGGTACACCACAACTGGTGCCTCAAGAAATAAGAGAGGGGTCTTTGTGCTAGGGTTCTTGGGTTTTCTCGCGACAGCAGGTTCTGCAATGGGCGCGGCGTCGCTGACGCTGTCGGCTCAGTCCCGGACTTTGTTGGCTGGGATAGTGCAGCAACAGCAACAGCTGTTGGATGTGGTCAAGAGACAACATGAATTGTTGCGACTGACCGTCTGGGGAACTAAGAACCTCCAGACTAGAGTCACTGCTATCGAGAAGTACCTGAAGGATCAGGCGCAGCTAAATTCATGGGGATGTGCTTTTAGGCAAGTCTGTCACACTACTGTACCATGGCCAAATGACTCATTGGTGCCTAATTGGGACAATATGACTTGGCAAGAGTGGGAAGGAAAGGTTGACTTCCTAGAGGCAAATATAACTCAATTATTAGAAGAAGCACAAATTCAGCAAGAAAAGAATATGTATGAATTGCAAAAACTAAATAGCTGGGATATCTTTGGCAATTGGTTTGACCTTACTTCTTGGATAAGATATATACAATATGGTGTACTAATAGTTTTAGGAGTAGTAGGGTTAAGAATAGTAATATATGTAGTGCAAATGCTAGCTAGGTTAAGACAGGGTTATAGGCCAGTGTTCTCTCCCCCTCCCGCTTATGTTCAGCAGATCCCTATCCACAAGGACCAGGAACCGCCAACCAAAGAAGGAGAAGAAGGAGAAGGTGGAGACAGAGGTGGCAGCAGATCTTGGCCTTGGCAGATAGAATATATTCATTTCCTAATCCGCCAACTGATACGCCTCTTGACTTGGCTATTCAGCAGCTGCAGGGATTGGCTATTGAGGATCTACCAGATCCTCCAACCAGTGCTCCAGAGACTCTCAAGGACGCTGCAAAGAGTTCGTGAAGTCATCAGAATTGAAATAACCTACCTACAATATGGGTGGAGCTATTTCCAAGAAGCAGCACAGGCGTGGTGGAAATTTGCGCGAGAGACTCTTGCGAGCGCGTGGAGAGACATATGGGAGACTCTGGGAAGGGTTGGAAGAGGGATACTCGCAATCCCTAGGCGCGTCAGGCAAGGGCTTGAGCTCGCTCTCTTGTGAGCCTCAGAAATATAGTGAGGGACAATATATGAATACCCCCTGGAGGAACCCAACAGCAGAAAAAGCAAAATTAGGTTATAAACAACAAAACATGGATGATGTGGATGATGAAGATGATGACTTAGTAGGTGTCTCAGTGCACCCAAAAGTCCCCTTAAGGGCCATGACATACAAATTGGCAATAGACATGTCTCATTTTATAAAAGAAAAGGGGGGACTGGAAGGGATTTATTACAATGAGAAAAGACATAGAATATTAGATATGTACATGGAAAAGGAAGAAGGAATAATACCAGATTGGCAAAATTACACATTAGGGCCAGGAACTAGATACCCTATGTACTTTGGGTGGCTCTGGAAATTAGTCCCAGTAGATGTCTCAGATGAAGCCCAGGAAGACGAGACACATTGCCTGGTGCATCCAGCACAGACTCATCAGTGGGATGACCCCTGGGGAGAGGTACTGGCATGGAAGTTTGATCCAGAATTGGCTTATAGCTATAAGGCATTTATTAAGTACCCAGAAGAGTTTGGTAGTAAGTCAGGCTTGTCAGAGGAAGAGGTAAAGAGAAGGCTAACCGCAAGAGGCATTTATAAAATGGCTGACAAGAGGGAAACAAGCTGAGACAGCAGGGACTTTCCACAAGGGACTTTCCACAAGGGGCTGTCATGGGGAGGTACTGGGGAGGAGCTGGCTGGAACGCCCACTTATTCTCTGTATAAATACAACTGCATTTCGCTCTGTAGTCAGTCGCTCTGCGGAGAGGCTGGCAGATTGAGCCCTGGGAGGTTCTCTCCAGCACTAGCAGGTAGAGCCTGGGTGTTCCCTGCTAGACTCTCACCAGCACTTGGCCGGTGCTGGGCAGAGTGGCTCCACGCTTGCTTGCTTAAAGACCTCTTCAATAAAGCTGCCATTTAGAAGTAAGCAAGTGTGTGTTCCCATCTCTCCTAGTCGCCGCCTGGTCATCTCGGTACTCGACACATAAAGAAGACCCTGGTCTGTTAGGACCCTTTCTGCTTTGGGAAACCGAGGCAGGAAAATCCCTAGCA'),
('SIVsmE041-2', 'Virus', 'SIVsmE041-2', 'RNA', 'SIV', 'ACAGGGACTTGAAGGAGAGTGAGAGCTCCTGAGTACGGCTGAGTGAAGGCAGYAAGGGCGGCAGGAAYAAACCACGACGGAGTGCTCCTATAAAGGCGCGGGCCGGTACCAGGCGGCGTGAGGAGCGGGAGTCGGAGAGGCCTCCGGTTGCAGGTAAGTGCAACAAAAGAGTCATAGGACTGAGTTCCCTACTTTTGAGRAAAGAGTAGGAGAGTGGGAGATGGGCGCGAGAARCTCCGTCTTGTCAGGGAAAAAAGCAGATGAATTAGAAAAAATTAGGTTACGGCCCGGCGGAAAGAAAAAGTACATGCTGAAGCATGTAGTGTGGGCAGCAAACGAATTGGACARATTTGGATTAGCAGAAAGCCTGTTGGAGAACAAAGAAGGTTGTCAAARAATTCTTTCAGTYTTAGCTCCATTAGTTCCGACAGGTTCAGAAAATTTAAAGAGCCTYTATAATACTGTCTGCGTCATTTGGTGCATTCACGCAGAAGAGAAAGTGAAACATACTGAGGAAGCAAAACAAATAGTGCAGAGACATCTAGTGGTGGAAACAGGAACAGCAGACAAAATGCCAGCAACAAGTAGACCAACAGCACCACCTAGTGGCAGAGGAGGAAATTACCCAGTGCAGCAAGTAGGTGGCAATTATACCCACCTACCCTTAAGTCCAAGAACATTAAATGCTTGGGTAAAATTGRTAGAAGAGAAAAAATTTGGGGCAGAAGTAGTGCCAGGATTTCARGCACTATCAGAAGGCTGCACYCCCTATGACATCAATCAGATGCTAAATTGTGTRGGGGAACAYCAATCAGCCATGCAAATTATTAGAGAAATTATAAATGAAGAAGCTGCTGATTGGGATTTACAACACCCGCAGCCAGGTCCAATACCAGCAGGACARCTTAGAGATCCGAGAGGATCAGACATTGCAGGAACTACTAGCACAGTAGAAGAACAAATTCAATGGATGTATAGGCAGCAAAACCCTATACCAGTAGGTAACATTTACAGAAGGTGGATCCAATTAGGGCTGCAAAAATGTGTAAGGATGTATAATCCAACAAACATTTTAGATGTGAAACARGGACCRAAAGAGCCATTTCAAAGCTATGTAGATAGATTCTACAAGAGTCTAAGAGCAGAACAAACAGACCCAGCAGTGAAAAATTGGATGACTCAAACACTGCTGATTCAAAATGCTAACCCGGATTGCAAATTGGTGCTCAAGGGTCTGGGTATGAATCCCACTTTAGAAGAAATGCTGACAGCCTGTCAGGGARTAGGAGGACCAGGACAAAAAGCTAGACTAATGGCAGAAGCCTTGAAAGAGGCACTGACGCCAGGACAACTCCCATTTGCAGCAGTCCAACAGAGAGGACAAAGAAAGACAATTAAATGYTGGAATTGTGGAAAGGAGGGACACTCTGCGAGACAATGCAGAGCCCCTAGAAGACAGGGCTGCTGGAAGTGTGGARAAACAGGCCATGTTATGGCCAAATGCCCCGAGAGACAGGCGGGTTTTTTAGGGCTTGGCCCATGGGGAAAGAAGCCCCGCAATTTCCCCATGGCCCAGATACCTCAGGGGTTGACACCAACTGCTCCCCCAGAGGATCCAGCTGTGGATCTACTGAAGAATTACATGAGGATGGGCAGAAGGCAGAGGGARAACAGAGAGAGACCTTACAAGGARGTGACGGAGGATTTGCTGCACCTCAATTCTCTCTTTGGAGAAGACCAGTAGTTACTGCCTACATTGAAGAACAGCCCGTAGAAGTATTATTAGATACAGGGGCTGATGATTCAATYGTAGCAGGGATAGAATTGGGTCCAAATTATACCCCTAAAATAGTAGGAGGRATAGGAGGTTTCATTAACACCAAGGAATATAAAGATGTAAAAATAAAAGTCTTAGGCAARGTAATTAAGGGAACAATTATGACAGGAGATACCCCAATTAACATTTTTGGCAGAAATCTGCTAACAGCTATGGGCATGTCTCTAAATCTCCCCATAGCTAAGGTGGAACCTATCAAAGTAACACTAAAACCAGGAAAAGATGGACCAAAATTAAGACAGTGGCCGCTATCAAAAGAAAAGATAATTGCATTAAGRGAGATCTGTGAAAAAATGGAAAAAGATGGCCAGTTAGAGGAAGCCCCTCCAACCAATCCATATAACACCCCCACATTTGCTATAAAGAAGAAAGACAAAAATAAATGGAGGATGCTAATAGACTTTAGAGAATTAAACAAGGTTACTCAAGATTTTACAGAAGTACAGYTAGGAATACCACACCCTGCAGGACTAGCAAAGAGAAGAAGGATCACAGTATTGGATGTAGGTGATGCATATTTCTCCATACCTTTAGATGAGGAATTCAGGCAATACACTGCCTTTACTTTACCATCAGTAAACAATGCAGAACCAGGAAAAAGATACATCTATAAGGTAYTACCTCAAGGGTGGAAAGGATCACCAGCTATTTTTCAGCATACYATGAGAAATGTCTTAGAACCTTTCAGAAAAGCAAATCCAGATGTGACMCTGATCCAATACATGGATGAYATCCTAATAGCTAGTGAYAGAACAGATTTAGAACATGACAGGGTAGTTTTACAGTTAAAGGAACTTCTAAACAGTATGGGATTTTCCACCCCAGAAGAGAAGTTCCAGAAAGATCCCCCATTCCAGTGGATGGGATATGAATTGTGGCCAACCAAATGGAAACTGCAAAAAATAGAGTTGCCACAAAGAGAAACCTGGACAGTAAATGATATACAAAARTTAGTAGGAGTGCTAAATTGGGCAGCACAAATTTATCCAGGAATAAAGACTAAACACCTTTGCAGATTAATCAGAGGAAAAATGACTTTAACAGAAGAGGTTCAGTGGACTGAGATGGCAGAGGCAGAATATGAAGAAAAYAAGATAATTCTCAGTCAAGAACAAGAAGGGTGTTACTATCAAGAGGGAAAGCCACTGGAGGCAACAGTAATAAAGAGTCAGGATAATCAATGGTCATATAAAATTCACCAAGAAGACAAAATACTAAAAGTAGGCAAATTTGCAAAGATTAAGAATACACATACAAATGGAGTCAGATTATTAGCACAYGTAGTACAGAAAATAGGAAAAGAAGCAATAGTAATCTGGGGACAGGTGCCAAAATTTCATTTGCCAGTAGAGAGAGAAATCTGGGAACAATGGTGGACAGATTATTGGCAAGTAACCTGGATACCAGAATGGGACTTTGTATCAACACCTCCCTTAGTCAGAYTAGTCTTCAACCTAGTAAAAGAACCTATACAGGGAGCAGAAACATTTTATGTAGATGGATCCTGTAACAGACAGTCAAAAGAAGGAAAGGCAGGCTATGTGACAGACAGAGGYAGAGACAGAACAAAACYGCTGGAGCAGACTACCAATCAACAAGCGGARTTGGAAGCCTTCTATCTAGCCTTAGCAGATTCAGGACCARAAGCAAATATAATAGTRGATTCCCAATATGTTATGGGCATAATAGCGGGTCAACCCACKGAATCAGAAAGTAGATTAGTAAATCAGATAATAGAGGAAATGATTAAAAAGGAAGCAATTTATGTAGCRTGGGTACCTGCACATAAAGGAATAGGAGGAAATCAAGAAGTAGATCATCTGGTWAGTCAAGGAATTAGACAAGTCCTATTCTTAGAAAAAATAGAACCAGCGCAAGAAGAGCATGAGAAGTACCATAGCAATGTAAAAGARTTAGTATTCAAATTTGGCTTACCTAGGCTAGTAGCAAAACAGATAGTAGACACATGTGATAAATGTCATCAGAAAGGAGAAGCCATACATGGACAGGTAAATGCAGAATTAGGGACTTGGCAAATGGACTGTACACATCTAGAGGGCAAAATAATTATAGTTGCAGTACATGTGGCTAGTGGATTCATAGAGGCAGAAGTAATCCCGCAGGAAACAGGAAGACAAACAGCACTGTTTCTGCTAAAATTAGCCAGCAGATGGCCCATCACACATCTGCATACTGATAATGGTGCCAATTTCACATCGCAAGAAGTGAAAATGGTTGCTTGGTGGGCAGRGATTGAACAGACCTTTGGGGTACCTTATAATCCACAGAGCCARGGAGTAGTGGAAGCAATGAACCATCATCTAAAAACCCAGATAGATAGGATTAGGGAACAGGCAAATTCAATAGAGACTATAGTACTAATGGCAGYTCATTGCATGAATTTTAAAAGAAGGGGAGGAATAGGGGATATGACTCCAGCAGAAAGATTAGTCAATATGATCACCACAGAACAAGAAATACAATTCCAACAATCAAAAAATTCAAAATTTAAAAATTTTCGGGTCTATTACAGAGAAGGCAGAGATCAGCTGTGGAAAGGACCCGGTGAGCTATTGTGGAAAGGGGAAGGAGCAGTCATCCTAAAGGTAGGGACAGAAATCAAGGTAGTACCAAGGAGGAAAGCTAAAATTATCAAAGACTATGGAGGAGGAAAAGAGTTGGATAGCGGTTCCMACTTGGAGGATACCGGGGAGGCTAGAGAAGTGGCATAGCCTCATCAAACACCTGAAATATAACACTAAAGACCTACAGAAGGCTTGTTATGTACCCCATCATAAAGTTGGATGGGCATGGTGGACTTGCAGCAGGGTAATCTTCCCATTAAGGGATGAGTCTCATTTGGAAGTACAAGGATATTGGAGTTTGACACCAGAGAARGGRTGGCTCAGTACTTATGCAGTRAGRATAACCTGGTACTCCAGAAATTTCTGGACAGATGTAACACCAGATTAYGCAGACACTTTACTGCATGGCACTTATTTCCCTTGCTTTTCAGAGGGAGAAGTACGAAGGGCCATCAGGGGAGAGAAATTGCTGTCTTGCTGCAAGTTCCCGAAAGCTCATAAGAATCAGGTACCAAGCCTACAGTATCTAGCACTAACAGTAGTGAGTCATGTCAGATCCCAGGGAGAGGATCCCACCTGGAAACAGTGGAGAGGAAACAGTAGGCGAGGCCTTCGACTGGCTAGAAAGAACAGTAGAAGAAATAAACAGGGCAGCAGTGAATCATTTGCCGAGGGAGTTAATTTTCCAGGTTTGGCGAAGGTCCTGGGAATACTGGCATGATGAAATAGGGATGTCAGCTAGTTACACAAAATACAGATACTTGTGCTTGATACAAAAAGCTTTGTTTATGCATTGCAAGAAAGGGTGTAGGTGCTTAGGAGGAGAGCATGGGGCAGGGGGATGGAGATCAGGGCCTCCTCCTCCTCCCCCTCCAGGACTAGCATAAAATGACAGAAAGACCTCCAGAAGATGAAGCCCCACAGAGGGAACCGTGGGATGAATGGGTAGTAGAAGTTCTGGAGGAAGTAAAAGAAGAAGCCCTGAAACATTTTGATCCTCGCTTGCTAACTGCGCTTGGTAACTATATCTATGATAGACATGGAGACACCCTTGAAGGAGCAGGAGAGCTCATTAGAATCCTCCAGAGAGCACTCTTCATCCATTTCAGAGGTGGATGCAACCACTCCAGAATCGGCCACTCTGGAGGAGGAAATCCTCTCTCAACTATACCGCCCTCTAGAGGCGTGCTATAACAAGTGCTACTGTAAGAAGTGTTGCTATCATTGTCAGCATTGTTTTCTTAAAAAGGGTTTGGGARTATGCTATGAGCAGCAACGAAGAAGAACTCCGAAGAAGACTAAGGCTAATACATTTTCTGCATCAAACAAGTAAGTATGGGATGTCTTGGGAATCAGCTGCTTATCGCGCTCTTGCTATTAAGTGCTTTAGGGATTTCTTGTGTTCAATATGTGACAGTGTTCTATGGTATACCAGCATGGAAGAATGCGACAGTTCCCCTCTTCTGTGCAACTGAGAATAGGGACACTTGGGGAACAACACAATGCTTGCCAGATAATAATGATTACTCAGAATTGGCAATTAATGTCACAGAGGCTTTTGATGCTTGGGATAATACAGTCACAGAACAAGCAATAGAGGATGTGTGGAACCTCTTTGAAACATCCATTAAGCCCTGTGTAAAACTCACCCCCCTATGTATAGCAATGAGGTGTAATAAAACTGAGACAGATAGATGGGGCCTAACAGGAAAACCAGTAACAACGACAACATCAACAACAACAAAATCAACATCAAAACCACCAGCATTAACAGCAAAGGTTATAAATGAAAATGATCCATGTATAARAACTGATAATTGTGCAGGCTTGGAACAGGAGCCCATGATAAGTTGTAAATTTAACATGACAGGGTTAAKAAGGGACAAAAAGAAAGAATATAATGAAACATGGTATTCAAGAGATATAGTTTGTGAACAAAATAACAATGGAAATGAAAATGAAAGTAAATGCTATATGAACCATTGTAACACTAGTGTTATTCAAGAATCCTGTGACAAGCATTATTGGGATGCTATTAGATTTAGATATTGTGCTCCGCCAGGTTATGCTTTGCTTAGGTGTAATGATTCAAATTATTCAGGCTTTGAACCTAACTGTACTAAGGTAGTAGTTTCTTCATGCACAAGAATGATGGAAACACAAACCTCTACTTGGTTTGGTTTCAATGGTACTAGAGCAGAAAATAGAACATACATTTATTGGCATGGCAGAAGCAATAGAACCATAATTAGCTTAAATAAGTATTATAATCTAACAATGAGCTGTAGGAGACCAGGAAAAAAGATAGTCTTACCAGTCACCATTACGTCAGGGTTGATCTTCCATTCGCAAACCATAAATAAGAGGCCAAAACAGGCCTGGTGCTGGTTTRGRGGARAYTGGAAAGGGGCYATCCGAGAAGTGAAGGAAACCTTGGTCAAACATCCCAGGTATACGGGAACTAATGATACTRAGMARATTAATCTAACAGCTCCAGSAGGAGGAGATCCRGAAGTTACTTTCATGTGGACAAATTGTCGAGGAGAATTCTTATATTGCAAAATGAATTGGTTTCTTAATTGGGTAGATGAGACAAATGGTTTTAGATGGNNNNNNCAAAAMCMGAAGGAGAAGAAAAGGAGGAATTATGTGCCATGTCATATTAGACAGGTAATCAAYACGTGGCACAGRGTAGGCAAAAATGTGTATTTGCCTCCTAGGGAAGGAGAYYTGACATGTAATTCCACTGTAACTAGCCTCATAGCAGAAATAGATTGGATCGATAAAAATGAGACCAATATCACCATGAGTGCAGAGGTGGCAGAGCTGTATCGATTGGAGTTGGGAGATTACAAATTAGTAGAGATTACTCCAATTGGCTTGGCCCCCACAAGTGTRAGAAGGTACACCACAACCGGTGCCTCAAGAAATAAAAGAGGGGTCTTTGTGCTAGGGTTCTTGGGTTTTCTCGCRACAGCAGGTTCTGCAATGGGCGCGGCGTCGCTGACGCTGTCGGCTCAGTCCCGGACTTTGTTGGCTGGGATAGTGCAGCAACAGCAACAGCTGTTGGATGTGGTCAAGAGACAACAAGAATTGTTGCGACTGACCGTCTGGGGAACTAAGAACCTCCAGACTAGAGTCACTGCTATCGAGAAGTACCTAAAGGATCAGGCGCATCTAAATTCATGGGGATGTGCTTTTAGGCAGGTCTGCCACACTACTGTACCATGGCCAAATGACACATTGATGCCTAATTGGGACAATATGACTTGGCAAGAGTGGGAAAGACAGGTTGACTTCCTAGAGGCAAATATAACTCAATTACTGGAAGAAGCACAAATTCAGCAAGAAGAGAACATGTATGAGTTGCAAAAATTAAATAGCTGGGATATCTTTGGCAATTGGTTTGACCTTACTTCTTGGATAAAATATATACAATATGGTGTACTTATAGTTTTAGGAGTAATAGGATTAAGAATAGTAATATATGTAGTGCAGATGTTAGCTAGGTTAAGACAGGGTTATAGGCCAGTGTTCTCTTCCCCTCCCGTTTATGTTCAGCAGATCCCTATCCAGAAGGGCCAGGAACCGCCAACCAAAGAAGGAGAAGAAGAAGACGGTGGAGGCAGAGGTGGCAACAGATCTTGGCCTTGGCAGATAGAATATATTCATTTCCTGATCCGCCAGCTAATACGCCTCTTGACTTGGCTATTCAACAGTTGCAGAGATTGGCTATTGAGGAGCTGCCAAATCCTCCAGCCAGTGCTCCAGAGCCTCTCAAGGACATTGCAGAGAGTCCGTGAAGTCATCAGGGTAGAGATAGCCTACCTACAGTATGGGTGGCGTTACTTCCAAGAAGCAGCGCAAGCATGGTGGAAATTTGCGCGAGAGACTCTTGCAAGCGCGTGGAGAGACTTATGGGAGACTCTGGGACGGGTTGGAAGGGGAATACTCGCAATCCCAAGACGTATCAGGCAAGGGCTTGAGCTCACTCTCTTGTGAGCCTCNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNAGGAACCCAACAGCAGAAAGAGCAAAATTAGATTATAGACAACAAAACATGGATGATGTGGATGATGATGANNNARTAGGYTTTCCAGTGACCCCAAGAGTCCCCTTAAGGACTATGACATACAAATTGGCAATAGACATGTCTCATTTTATAAAAGAAAAGGGGGGACTGGAAGGGATTTATTACAGTGATAGGAGACATAGAATATTGAATCTGTACTTAGAAAAGGAAGAAGGAATAATACCAGATTGGCAAAATTACACAGCAGGGCCAGGAATCAGATACCCTATGTGCTTTGGATGGCTCTGGAAATTAGTCCCAGTAGATGTCTCAGATGAAGCTCAGGAGGACGAGGCACATTGCTTGATGCATCCAGCACAGACCTCTCAGTGGGATGACCCCTGGGGAGAGGTACTGGCATGGAAGTTTGATCCAGAGTTAGCTTATAACTATATGGCATTTGTTAAGCACCCAGAAGAGTTTGGTAGTAGATCAGGCTTGTCAGAGGAAGAGGTAAAGAGAAGGCTAACCGCAAGAGGCCTTTTAAAAATGGCTGACAAGAAGGAAACAAGCTGAGACAGCAGGGACTTTCCACAAAGGGGATGTTATGGGGAGGTACTGGGGAGGAACTGGCTGGAACGCCCACTTAT'),
('A_Kawasaki_173_2001_NA', 'Virus', 'A_Kawasaki_173_2001', 'RNA', 'Influenza A', 'AGCAAAAGCAGGAGTTTAAAATGAATCCAAATCAAAAAATAATAACCATTGGATCAATCAGTATAGCAATCGGAATAATTAGCCTAATGTTGCAAATAGGAAACATTATTTCAATATGGGCTAGTCACTCAATCCAAACTGGAAGTCAAAACCACACTGGAGTATGCAACCAAAGAATCATCACATATGAAAACAGCACCTGGGTGAATCACACATATGTTAATATTAACAACACCAATGTTATTGCTGGAAAGGACAAAACTTCAGTGACATTGGCCGGCAATTCATCTCTTTGTTCTATCAGTGGATGGGCTATATACACAAAAGACAACAGCATAAGAATTGGTTCCAAAGGAGATGTTTTTGTCATAAGAGAGCCTTTCATATCATGTTCTCACTTGGAATGCAGAACCTTTTTTCTGACCCAAGGTGCTCTATTAAATGACAAACATTCAAATGGGACCGTTAAGGACAGAAGTCCCTATAGGGCTTTAATGAGCTGTCCTCTAGGTGAAGCTCCGTCCCCATACAATTCAAAGTTTGAATCAGTTGCTTGGTCAGCAAGCGCATGCCATGATGGCATGGGCTGGTTAACAATCGGAATTTCTGGTCCAGACAATGGAGCAGTGGCTGTACTAAAATACAACGGCATAATAACTGAAACCATAAAAAGTTGGAAAAAGCAAATATTAAGAACACAAGAGTCTGAATGTGTCTGTGTGAACGGGTCATGTTTCACCATAATGACCGATGGCCCGAGTAATGGGGCCGCCTCGTACAAAATCTTCAAGATCGAAAAGGGAAAGGTTACTAAATCAATAGAGTTGAATGCACCCAATTTTCATTATGAGGAATGTTCCTGTTACCCAGACACTGGCACAGTGATGTGTGTATGCAGGGACAACTGGCATGGTTCAAATCGACCCTGGGTGTCTTTTAATCAAAACCTGGATTATCAAATAGGATACATCTGCAGTGGGGTGTTCGGTGACAATCCGCGTCCCAAAGATGGAGAGGGCAGCTGTAATCCAGTGACTGTTGATGGAGCAAACGGAGTAAAGGGGTTTTCATACAAATATGGTAATGGTGTTTGGATAGGAAGGACTAAAAGTAACAGACTTAGAAAGGGGTTTGAGATGATTTGGGATCCTAATGGATGGACAGATACCGACAGTGATTTCTCAGTGAAACAGGATGTTGTGGCAATAACTGATTGGTCAGGGTACAGCGGAAGTTTCGTTCAACATCCTGAGTTAACAGGATTGGACTGTATAAGACCTTGCTTCTGGGTTGAGTTAGTCAGAGGACTGCCAAAAGAAAATACAACAATCTGGACTAGTGGGAGCAGCATTTCTTTTTGTGGCGTAAATAGTGATACTGCAAACTGGTCTTGGCCAGACGGTGCTGAGTTGCCGTTTACCATTGACAAGTAGTTCGTTGAAAAAACTCCTTGTTTCTACT'),
('A_Kawasaki_173_2001_M', 'Virus', 'A_Kawasaki_173_2001', 'RNA', 'Influenza A', 'AGCAAAAGCAGGTAGATATTGAAAGATGAGTCTTCTAACCGAGGTCGAAACGTACGTTCTCTCTATCATCCCTTCAGGCCCCCTCAAAGCCGAGATCGCACAGAGACTTGAAGATGTCTTTGCTGGAAAGAATACCGATCTTGAGGCTCTCATGGAATGGCTAAAGACAAGACCGATCCTGTCACCTCTGACTAAGGGGATTTTAGGATTTGTGTTCACGCTCACCGTGCCCAGTGAGCGAGGACTGCAGCGTAGACGCTTTGTCCAAAATGCCCTTAATGGGAATGGGGATCCAAATAATATGGACAGAGCAGTTAAACTGTATCGAAAGCTTAAGAGGGAGATAACATTCCATGGGGCCAAAGAAATAGCACTCAGTTATTCTGCTGGTGCACTTGCCAGTTGTATGGGACTCATATACAACAGGATGGGGGCTGTGACCACCGAATCAGCATTTGGCCTTATATGTGCAACCTGTGAACAGATTGCCGACTCCCAGCATAAGTCTCATAGGCAAATGGTAACAACAACCAATCCATTAATAAGACATGAGAACAGAATGGTTCTGGCCAGCACTACAGCTAAGGCTATGGAGCAAATGGCTGGATCGAGTGAACAAGCAGCTGAGGCCATGGGAGGTTGCTAGTCAGGCCAGGCAGATGGTGCAGGCAATGAGAGCCATTGGGACTCATCCTAGCTCTAGCACTGGTCTGAAAAATGATCTCCTTGAAAATTTGCAGGCCTATCAAAAACGAATGGGGGTGCAGATGCAACGATTCAAGTGATCCTCTTGTTGTTGCCGCAAGTATAATTGGGATTGTGCACCTGATATTGTGGATTATTGATCGCCTTTTTTCCAAAAGCATTTATCGTATCTTTAAACACGGTTTAAAAAGAGGGCCTTCTACGGAAGGAGTACCAGAGTCTATGAGGGAAGAATATCGAGAGGAACAGCAGAATGCTGTGGATGCTGACGATGGTCATTTTGTCAGCATAGAGCTGGAGTAAAAAACTACCTTGTTTCTACT'),
('A_Kawasaki_173_2001_NS', 'Virus', 'A_Kawasaki_173_2001', 'RNA', 'Influenza A', 'AGCAAAAGCAGGGTGGCAAAGACATAATGGATTCCCACACTGTGTCAAGCTTTCAGGTAGATTGCTTCCTTTGGCATGTCCGCAAACAAGTTGCAGACCAAGGTCTAGGCGATGCCCCCTTCCTTGATCGGCTTCGCCGAGATCAGAAGTCTCTAAAGGGAAGAGGCAGCACTCTCGGTCTGAACATCGAAACAGCCACTTGTGTTGGAAAGCAAATAGTAGAGAGGATTCTGAAAGAAGAATCCGATGAGGCATTTAAAATGACCATGGCCTCCGCACTTGCTTCGCGGTACCTAACTGACATGACTATTGAAGAAATGTCAAGGGACTGGTTCATGCTCATGCCCAAGCAGAAAGTGGCTGGCCCTCTTTGTGTCAGAATGGACCAGGCGATAATGGATAAGAACATCATACTGAAAGCGAATTTCAGTGTGATTTTTGATCGGTTGGAGAATCTGACATTACTAAGGGCTTTCACCGAAGAGGGAGCAATTGTTGGCGAAATTTCACCATTGCCTTCTCTTCCAGGACATACTAATGAGGATGTCAAAAATGCAATTGGGGTCCTCATCGGGGGACTTGAATGGAATGATAACACAGTTCGAGTCTCTGAAACTCTACAGAGATTCGCTTGGAGAAGCAGTAATGAGACTGGGGGACCTCCATTCACTCCAACACAGAAACGGAAAATGGCGGGAACAATTAGGTCAGAAGTTTGAAGAAATAAGATGGCTGATTGAAGAAGTGAGGCATAAATTGAAGACGACAGAGAATAGTTTTGAGCAAATAACATTTATGCAAGCATTACAGCTATTGTTTGAGGTGGAACAAGAGATTAGAACGTTTTCGTTTCAGCTTATTTAATGATAAAAAACACCCTTGTTTCTACT'),
('A_Kawasaki_UTK-04_09_HA', 'Virus', 'A_Kawasaki_UTK-04_09', 'RNA', 'Influenza A', 'ATGAAAGTAAAACTACTGGTCCTGTTATGCACATTTACAGCTACATATGCAGACACAATATGTATAGGCTACCATGCTAACAACTCGACCGACACTGTTGACACAGTACTTGAAAAGAATGTGACAGTGACACACTCTGTCAACCTGCTTGAGAACAGTCACAATGGAAAACTATGTCTATTAAAAGGAATAGCCCCACTACAATTGGGTAACTGCAGCGTTGCCGGGTGGATCTTAGGAAACCCAGAATGCGAATTACTGATTTCCAAGGAGTCATGGTCCTACATTGTAGAAAAACCAAATCCTGAGAATGGAACATGTTACCCAGGACATTTCGCTGACTATGAGGAACTGAGGGAGCAATTGAGTTCAGTATCTTCATTTGAGAGGTTCGAAATATTCCCCAAAGAAAGCTCTTGGCCCAACCACACCGTAACCGGAGTGTCAGCATCATGCTCCCATAATGGGGAAAACAGTTTTTACAGAAATTTGCTATGGCTGACGGGGAAGAATGGTTTGTACCCAAACCTGAGCAAGTCCTATGCAAACAACAAAGAAAAAGAAGTCCTTGTACTATGGGGTGTTCATCACCCGCCAAACATAGCTGACCAAAAGACCCTCTATCATACAGAAAATGCTTATGTTTCTGTAGTGTCTTCACATTATAGCAGAAAATTCACCCCAGAAATAGCCAAAAGACCCAAAGTAAGAGATCAAGAAGGAAGAATCAACTACTACTGGACTCTGCTTGAACCCGGGGATACAATAATATTTGAGGCAAATGGAAATCTAATAGCGCCAAGATATGCTTTCGCACTGAGTAGAGGCTTTGGATCAGGAATCATCAACTCAAATGCACCAATGGATAAATGTGATGCGAAGTGCCAAACACCTCAAGGAGCTATAAACAGCAGTCTTCCTTTCCAGAACGTACACCCAGTCACAATAGGAGAGTGTCCAAAGTATGTCAGGAGTGCAAAATTAAGGATGGTTACAGGACTAAGGAACATCCCATCCATTCAATCCAGAGGTTTGTTTGGAGCCATTGCCGGTTTCATTGAAGGGGGGTGGACTGGAATGGTAGATGGTTGGTATGGTTATCATCATCAGAATGAGCAAGGATCTGGCTATGCTGCAGATCAAAAAAGCACACAAAATGCCATTAATGGGATTACAAACAAGGTGAATTCTGTAATTGAGAAAATGAACACTCAATTCACAGCAGTGGGCAAAGAATTCAACAAATTAGAAAGAAGGATGGAAAACTTGAATAAAAAAGTTGATGATGGATTTATAGACATTTGGACATATAATGCAGAACTGTTGGTTCTACTGGAAAATGAAAGGACTTTGGATTTCCATGACTCCAATGTGAAGAATCTGTATGAGAAAGTAAAAAGCCAGTTAAAGAATAATGCTAAAGAAATAGGAAATGGGTGTTTTGAATTCTATCACAAGTGTAACGATGAATGCATGGAGAGTGTAAAGAATGGAACTTATGACTATCCAAAATATTCCGAAGAATCAAAGTTAAACAGGGAGAAAATTGATGGAGTGAAATTGGAATCAATGGGAGTCTATCAGATTCTGGCGATCTACTCAACAGTCGCCAGTTCTCTGGTTCTTTTGGTCTCCCTGGGGGCAATCAGCTTCTGGATGTGTTCCAATGGGTCTTTGCAGTGTAGAATATGCATC'),
('A_Kawasaki_UTK-04_09_M', 'Virus', 'A_Kawasaki_UTK-04_09', 'RNA', 'Influenza A', 'ATGAGTCTTCTAACCGAGGTCGAAACGTACGTTCTCTCTATCATCCCGTCAGGCCCCCTCAAAGCCGAGATCGCACAGAGACTTGAAGATGTATTTGCTGGAAAGAATACCGATCTTGAGGCTCTCATGGAGTGGTTAAAGACAAGACCAATCCTGTCACCTCTGACTAAGGGGATTTTAGGATTTGTGTTCACGCTCACCGTGCCCAGTGAGCGAGGACTGCAGCGTAGACGCTTTGTCCAAAATGCCCTTAATGGGAATGGGGATCCAAATAATATGGACAGAGCAGTCAAACTTTATCGAAAGCTTAAGAGGGAGATAACATTCCATGGGGCCAAAGAAATAGCACTCAGTTATTCTGCTGGTGCACTTGCCAGTTGTATGGGACTCATATACAACAGGATGGGGGCTGTGACCACCGAATCAGCATTTGGCCTTATATGTGCAACCTGTGAACAGATTGCCGACTCCCAGCATAAGTCTCACAGGCAAATGGTAACAACAACCAATCCATTAATAAGACATGAGAACAGAATGGTTCTGGCCAGCACCACAGCTAAGGCTATGGAACAAATGGCTGGATCGAGCGAACAAGCAGCTGAGGCCATGGAGGTTGCTAGTCAGGCCAGGCAGATGGTGCAGGCAATGAGAGCCATTGGGACTCATCCTAGCTCTAGCACTGGTCTGAAAAATGATCTCCTTGAAAATTTACAGGCCTATCAGAAACGAATGGGGGTGCAGATGCAACGATTCAAGTGATCCTCTTGTTGTTGCCGCAAGTATAATTGGGATTGTGCACTTGATATTGTGGATTATTGATCGCCTTTTTTCCAAAAGCATTTATCGTATCTTTAAACACGGTTTAAAAAGAGGGCCTTCTACGGAAGGAGTACCAGAGTCTATGAGGGAAGAATATCGAGAGGAACAGCAGAATGCTGTGGATGCTGACGATGATCATTTTGTCAGCATAGAGCTGGAGTAAAAA'),
('A_Kawasaki_UTK-04_09_NA', 'Virus', 'A_Kawasaki_UTK-04_09', 'RNA', 'Influenza A', 'ATGAACCCAAATCAAAAGATAATAACCATTGGATCAATCAGTATAGCAATCGGAATAATTAGTCTAATGTTGCAAATAGGAAATATTATTTCAATATGGGCTAGTCACTCAATCCAAACTGGGAGTCAAAACAACACTGGAATATGCAACCAAAGAATCATCACATATGAAAACAGCACCTGGGTGAATCACACATATGTTAATATTAACAACACTAATGTTGTTGCTGGAGAGGACAAAACATCAGTGACATTGGCCGGCAATTCATCTCTTTGTTCTATCAGTGGATGGGCTATATACACAAAAGACAACAGCATAAGAATTGGCTCCAAAGGAGATGTTTTTGTCATAAGAGAACCTTTCATATCATGTTCTCACTTGGAATGCAGAACCTTTTTTCTGACCCAAGGCGCTCTATTAAATGACAAACATTCAAATGGGACCGCAAAGGACAGAAGTCCTTATAGGGCCTTAATGAGCTGTCCTCTAGGTGAAGCTCCGTCCCCATACAATTCAAAGTTCGAATCAGTTGCATGGTCAGCAAGCGCATGCCATGATGGCATGGGCTGGTTAACAATCGGAATTTCTGGTCCAGACAATGGAGCTGTGGCTGTACTAAAATACAACGGAATAATAACTGGAACCATAAAAAGTTGGAAAAAGCAAATATTAAGAACACAAGAGTCTGAATGTGTCTGTATGAACGGGTCATGTTTCACCATAATGACCGATGGCCCGAGTAATAAGGCCGCCTCGTACAAAATTTTCAAGATCGAAAAGGGGAAGGTTACTAAATCAATAGAGTTGAATGCACCCAATTTTTATTATGAGGAATGCTCCTGTTACCCAGATACTGGCATAGTGATGTGTGTATGCAGGGACAACTGGCATGGTTCAAATCGACCTTGGGTGTCTTTTAATCAAAACTTGGATTATCAAATAGGATACATCTGCAGTGGAGTGTTTGGTGACAATCCGCGTCCCGAAGATGGAGAGGGCAGCTGCAATCCAGTGACTGTTGATGGAGCAAACGGAGTAAAAGGGTTTTCATACAAATATGGTAATGGTGTTTGGATAGGGAGGACCAAAAGTAACAGACTTAGAAAGGGGTTTGAGATGATTTGGGATCCTAATGGATGGACAAATACCGACAGTGATTTCTCAGTGAAACAGGATGTTGTAGCAATAACTGATTGGTCAGGGTACAGCGGAAGTTTCGTCCAACATCCTGAGTTAACAGGATTGGGCTGTATAAGACCTTGCTTCTGGGTTGAGTTAGTCAGAGGGCTGCCTAGAGAAAATACAACAATCTGGACTAGTGGGAGCAGCATTTCTTTTTGTGGCGTTAATAGTGATACTGCAAACTGGTCTTGGCCAGACGGTGCTGAGTTGCCGTTCACCATTGACAAG'),
('A_Kawasaki_UTK-04_09_NP', 'Virus', 'A_Kawasaki_UTK-04_09', 'RNA', 'Influenza A', 'ATGGCGTCCCAAGGCACCAAACGGTCTTACGAACAGATGGAGACTGATGGGGAACGCCAGAATGCAACTGAAATCAGAGCATCCGTCGGAAGAATGATTGGTGGAATTGGGCGATTCTACATCCAAATGTGCACCGAGCTTAAGCTCAATGATTATGAGGGACGGCTGATCCAGAACAGCTTAACAATAGAGAGAATGGTGCTCTCTGCTTTTGATGAGAGGAGAAATAAATATCTAGAGGAACATCCCAGCGCGGGGAAAGATCCTAAGAAAACTGGAGGACCCATATACAAGAGAGTAGATGGAAAGTGGGTGAGGGAACTCGTCCTTTATGACAAAGAAGAAATAAGGCGGATTTGGCGCCAAGCCAACAATGGTGATGATGCAACGGCTGGTTTGACTCACATTATGATCTGGCATTCTAATTTGAATGATACAACTTACCAGAGGACAAGAGCTCTTGTCCGCACCGGAATGGATCCCAGGATGTGCTCTTTGATGCAAGGTTCAACTCTCCCTAGAAGATCTGGAGCAGCAGGCGCCGCAGTCAAAGGAGTTGGGACAATGGTATTGGAATTAATCAGGATGATCAAACGTGGGATCAATGACCGAAACTTCTGGAGGGGTGAGAATGGAAGAAAAACAAGGATTGCTTATGAGAGAATGTGCAACATTCTAAAAGGAAAATTTCAAACAGCTGCACAAAAAGCAATGATGGACCAAGTGAGAGAAAGCCGGAACCCAGGAAATGCTGAGATCGAAGATCTCACTTTTCTGGCACGGTCTGCACTCATATTGAGAGGATCAGTTGCTCACAAGTCTTGCCTGCCTGCCTGTGTGTATGGACCAGCCGTAGCCAGTGGGTATGACTTCGAAAAAGAGGGTTACTCTTTGGTAGGAGTAGACCCTTTCAAACTGCTTCAAACCAGTCAGGTATACAGTCTAATTAGACCAAACGAGAATCCCGCACACAAGAGCCAGTTGGTGTGGATGGCATGCAATTCTGCTGCATTTGAAGATCTAAGAGTGTCAAGCTTCATCAGAGGAACAAGAGTACTTCCAAGGGGGAAGCTCTCCACTAGAGGAGTACAAATTGCTTCAAATGAAAACATGGATGCTATTGTGTCAAGTACTCTTGAACTGAGAAGCAGATACTGGGCCATAAGAACCAGAAGTGGAGGGAACACTAATCAACAAAGGGCCTCTGCGGGCCAAATCAGCACACAACCTACGTTTTCTGTGCAGAGAAACCTCCCATTTGACAAAGCAACCATCATGGCAGCATTCTCTGGGAATACAGAGGGAAGAACATCAGACATGAGGGCAGAAATCATAAAGATGATGGAAAGTGCAAGACCAGAAGAAGTGTCCTTCCAGGGGCGGGGAGTCTTTGAGCTCTCGGACGAAAGGGCAACGAACCCGATCGTGCCCTCCTTTGACATGAGTAATGAAGGATCTTATTTCTTCGGAGACAATGCAGAGGAGTACGACAATTAAAGAAAA'),
('A_Kawasaki_UTK-04_09_NS', 'Virus', 'A_Kawasaki_UTK-04_09', 'RNA', 'Influenza A', 'ATGGACTCCCACACTGTGTCAAGCTTTCAGGTAGATTGCTTCCTTTGGCATGTCCGCAAACAAGTTGCAGACCAAGATCTAGGCGATGCCCCCTTCCTTGATCGGCTTCGCCGAGATCAGAAGTCTCTAAAGGGAAGAGGCAGTACTCTCGGTCTGAACATCGAAACAGCCACTTGTGTTGGAAAGCAAATAGTAGAGAGGATTCTGAAAGAAGAATCCGATGAGGCACTTAAAATGACCATGGCCTCCGCACTTGCTTCGCGGTACCTAACTGACATGACTGTTGAAGAAATGTCAAGGGACTGGTTCATGCTCATGCCCAAGCAAAAAGTGGCTGGCCCTCTTTGTGTCAGAATGGACCAGGCAACAATGGATAAGAACATCATACTGAAAGCGAATTTCAGTGTGATTTTTGACCGGTTGGAGAATCTGACATTATTAAGGGCTTTCACCGAAGAGGGAGCAATTGTTGGCGAAATTTCACCATTGCCTTCTTTTCCAGGACATACTAATGAGGATGTCAAAAATGCAATTGGGGTCCTCATCGGGGGACTTGAATGGAATGATAACACAGTTCGAGTCTCTGAAACTCTACAGAGATTCGCTTGGAGAAGCAGTAATGAGACTGGGGGACCTCCATTCACTACAACACAGAAACGGAAAATGGCGGGAACAACTAGGTCAGAAGTTTGAAGAAGTAAGATGGCTGATTGAAGAAGTGAGGCATAAATTGAAGACGACAGAGAATAGTTTTGAGCAAATAACATTTATGCAAGCATTACAGCTATTATTTGAAGTGGAACAAGAGATTAGAACGTTTTCGTTTCAGCTTATTTAG'),
('A_Kawasaki_UTK-04_09_PA', 'Virus', 'A_Kawasaki_UTK-04_09', 'RNA', 'Influenza A', 'ATGGAAGATTTTGTACGACAATGCTTCAATCCGATGATTGTCGAGCTTGCAGAAAAAGCAATGAAAGAGTATGGAGAGGACCTGAAAATCGAAACAAACAAATTTGCAGCAATATGCACCCACTTGGAAGTGTGCTTCATGTATTCAGATTTTCATTTCATCAATGAGCAAGGCGAATCAATAATAGTAGAGCCTGAGGACCCAAATGCACTTTTAAAGCACAGATTTGAGATAATAGAGGGACGAGATCGTACAATGGCATGGACAGTTGTAAACAGTATTTGCAACACCACAGGAGCTGAGAAACCAAAGTTCCTGCCAGATCTGTATGATTACAAAGAGAATAGATTCATCGAGATTGGAGTGACAAGGAGGGAAGTTCACATATACTATCTGGAAAAGGCCAACAAAATTAAATCTGAGAAGACACACATTCACATTTTCTCATTCACCGGCGAAGAAATGGCCACAAAGGCTGATTACACTCTCGATGAAGAAAGCAGAGCTAGGATTAAAACCAGATTGTTCACCATAAGACAAGAAATGGCAAGCAGAGGTCTTTGGGACTCCTTTCGTCAGTCCGAAAGAGGCGAAGAAACCATTGAAGAAAGATTTGAAATCACAGGGACAATGCGCAGGCTCGCTGACCAAAGCCTTCCGCCGAACTTCTCCTGCATTGAGAATTTTAGAGCCTATGTGGATGGATTTGAACCGAACGGCTACATTGAGGGCAAGCTTTCTCAAATGTCCAAAGAAGTAAATGCTAGAATTGAGCCTTTTTTGAAAACAACACCTCGACCAATTAGACTTCCGAATGGGCCTCCTTGTTTTCAGCGGTCAAAATTTCTGCTGATGGATTCTTTAAAATTAAGCATTGAGGATCCGAATCATGAAGGTGAGGGGATACCACTATATGATGCAATCAAGTGTATGAGGACATTCTTTGGATGGAAAGAACCCACTGTTGTCAAGCCACACGAGAAGGGAATAAATCCAAATTATCTGTTGTCGTGGAAACAAGTATTGGAAGAGCTGCAGGACATTGAGAGTGAGGAGAAGATTCCAAGAACAAAAAACATGAAAAAAACTAGTCAGCTAAAGTGGGCACTTGGTGAGAACATGGCACCAGAGAAGGTGGATTTTGATGACTGTAAAGATATAAGCGATTTGAAGCAATATGACAGTGACGAACCTGAATTAAGATCATTTTCAAGTTGGATCCAGAATGAGTTCAACAAGGCATGCGAGCTGACCGATTCAATCTGGATAGAGCTTGATGAGATTGGAGAAGATGTGGCTCCGATTGAACACATTGCAAGCATGAGAAGGAATTACTTCACAGCTGAGGTGTCCCACTGCAGAGCCACAGAATATATAATGAAGGGGGTATACATTAATACTGCTTTGCTCAATGCATCCTGTGCAGCAATGGATGATTTCCAACTAATTCCCATGATAAGCAAATGTAGAACTAAAGAGGGAAGGAGAAAGACCAATTTGTACGGCTTCATCGTAAAAGGAAGATCTCACTTAAGGAATGACACCGATGTGGTAAACTTTGTGAGCATGGAGTTTTCCCTCACTGACCCAAGACTTGAGCCACACAAATGGGAGAAGTACTGCGTTCTTGAGATAGGAGATATGCTTCTAAGGAGTGCAATAGGCCAAGTGTCAAGGCCCATGTTCTTGTATGTAAGGACAAATGGAACCTCAAAAATTAAAATGAAATGGGGAATGGAGATGAGGCGTTGCCTCCTCCAATCCCTCCAACAAATAGAGAGCATGATTGAAGCTGAGTCCTCTGTCAAAGAGAAAGACATGACAAAAGAGTTTTTTGAGAATAAATCAGAAACATGGCCCATTGGAGAGTCACCAAAAGGAGTGGAAGAAGGTTCCATTGGGAAAGTATGCAGGACACTGTTGGCTAAGTCAGTATTCAATAGCCTGTATGCATCTCCACAATTAGAAGGATTTTCAGCTGAGTCAAGAAAGTTGCTCCTCATTGTTCAGGCTCTTAGGGACAATCTGGAACCTGGGACCTTTGATCTTGGGGGGCTATATGAAGCAATTGAGGAGTGCCTGATTAATGATCCCTGGGTTTTGCTTAATGCTTCTTGGTTCAACTCCTTCCTAACACATGCATTGAGATAG'),
('A_Kawasaki_UTK-04_09_PB1', 'Virus', 'A_Kawasaki_UTK-04_09', 'RNA', 'Influenza A', 'ATGGATGTCAATCCGACATTACTTTTCTTAAAAGTGCCAGCACAAAATGCTATAAGCACAACTTTTCCTTATACTGGTGACCCTCCTTACAGCCATGGGACAGGAACAGGGTACACCATGGATACAGTCAACAGGACACACCAGTACTCAGAAAGAGGAAGATGGACAAAAAATACCGAAACGGGAGCACCGCAACTTAACCCAATTGATGGTCCCTTACCGGAAGACAATGAACCAAGTGGCTATGCCCAAACAGATTGTGTATTAGAAGCAATGGCTTTCCTTGAAGAATCCCATCCCGGTATCTTTGAAAACTCTTGTATTGAAACAATGGAGGTTGTTCAACAAACAAGGGTGGACAAACTGACACAAGGCAGACAGACCTATGACTGGACTCTAAATAGGAACCAGCCTGCTGCCACAGCATTGGCAAACACTATAGAAGTATTCAGATCAAACGGCCTCATAGCAAATGAATCTGGGAGGCTAATAGACTTCCTTAAAGATGTAATGGAGTCGATGGACAGAGGCGAAGTAGAGGTCACAACTCATTTTCAAAGAAAGAGGAGAGTGAGAGACAATGTAACTAAAAAAATGGTGACCCAAAGAACAATAGGCAAAAAGAAACATAAATTAGACAAAAGAAGTTACCTAATTAGGGCATTAACCCTGAACACAATGACCAAAGATGCTGAGAGGGGGAAACTAAAACGCAGAGCAATTGCAACCCCAGGAATGCAAATAAGAGGGTTTGTATACTTTGTTGAGACACTGGCAAGAAGCATATGTGAAAAGCTTGAACAATCAGGATTGCCAGTTGGAGGAAATGAGAAGAAAGCAAAGTTAGCAAATGTTGTAAGGAAGATGATGACCAACTCCCAGGACACTGAAATTTCTTTCACCATAACCGGAGATAACACAAAATGGAACGAAAATCAAAACCCTAGAATGTTCTTGGCCATGATCACATATATAACCAAAAATCAGCCTGAATGGTTCAGAAATATTCTAAGTATTGCTCCAATAATGTTTTCAAATAAGATGGCGAGACTAGGCAAGGGGTACATGTTTGAAAGCAAGAGTATGAAACTGAGAACTCAAATACCTGCAGAGATGCTAGCCAACATAGACTTGAAATATTTCAATGATTCAACAAAAAAGAAAATTGAAAAAATCCGACCATTATTAATAGATGGAACTGCATCATTGAGTCCTGGAATGATGATGGGCATGTTCAATATGTTGAGCACCGTCTTGGGCGTCTCCATTCTGAATCTTGGGCAAAAGAGATACACCAAGACTACTTACTGGTGGGATGGTCTTCAATCGTCTGATGATTTTGCTTTGATTGTGAACGCACCCAACTATGCAGGAATTCAAGCTGGAGTTGACAGGTTTTATCGAACCTGTAAGCTGCTCGGAATTAATATGAGCAAAAAGAAGTCTTACATAAACAGAACAGGTACCTTTGAATTCACGAGCTTTTTCTATCGTTATGGGTTTGTTGCCAATTTTAGCATGGAGCTTCCTAGTTTTGGGGTGTCTGGGGTCAATGAATCTGCAGACATGAGTATTGGAGTCACTGTCATCAAAAACAATATGATAAACAATGACCTTGGCCCAGCAACTGCTCAAATGGCCCTTCAGTTATTTATCAAAGATTACAGGTACACTTATCGATGCCACCGAGGTGACACACAAATACAAACCCGGAGATCATTTGAGATAAAGAAACTATGGGACCAAACCCGCTCAAAAGCTGGACTGTTGGTCTCTGATGGAGGCCCCAATTTGTATAACATTAGAAATCTCCATATTCCTGAAGTTTGCTTGAAATGGGAGTTGATGGATGAGGATTACCAGGGGCGTTTATGCAACCCATTAAACCCGTTTGTCAGCCATAAAGAGATTGAATCTGTGAACAGTGCAGTGATAATGCCGGCACATGGTCCAGCCAAAAATATGGAGTATGACGCTGTTGCAACAACACACTCCTGGGTCCCCAAAAGAAATCGATCCATTTTGAACACGAGCCAAAGGGGGATACTTGAAGATGAGCAAATGTATCAGAGGTGCTGCAATTTATTTGAAAAATTCTTCCCAAGTAGCTCATACAGAAGACCAGTTGGAATATCCAGTATGGTAGAGGCTATGGTCTCAAGAGCCCGAATTGATGCACGGATTGATTTCGAATCTGGAAGGATAAAGAAAGAGGAATTTGCTGAGATCATGAAGATCTGTTCCACCATTGAAGACCTCAGACGGCAAAAATGA'),
('A_Kawasaki_UTK-04_09_PB2', 'Virus', 'A_Kawasaki_UTK-04_09', 'RNA', 'Influenza A', 'ATGGAAAGAATAAAAGAGCTAAGGAATTTGATGTCACAATCTCGCACTCGCGAGATACTTACCAAAACTACTGTAGACCACATGGCCATAATCAAGAAATACACATCAGGAAGACAGGAGAAAAACCCATCACTTAGGATGAAATGGATGATGGCAATGAAATACCCAATTACTGCTGATAAAAGGATAACGGAAATGATTCCTGAAAGAAATGAGCATGGACAGACATTATGGAGTAAGGTGAATGATGCCGGATCAGACCGAGTGATGGTATCACCCCTGGCTGTGACATGGTGGAACAGAAATGGACCAGTGGCAAGTACTATTCACTATCCAAAAATCTACAAAACTTACTTTGAAAAGGTTGAAAGGTTAAAACAAGGAACCTTTGGCCCTGTACACTTTAGAAACCAAGTCAAAATACGCCGAAGAGTCGACATAAATCCTGGTCATGCAGACCTCAGCGCCAAGGAGGCACAGGATGTAATTATGGAAGTTGTTTTCCCTAATGAAGTAGGAGCCAGAATACTAACATCAGAATCGCAATTAACGATAACCAAGGAGAAAAAAGAAGAACTCCAAAATTGCAAAATTTCCCCTTTGATGGTTGCATACATGTTAGAGAGGGAACTTGTCCGCAAAACAAGATTTCTCCCGGTTGCAGGTGGAACAAGCAGTGTGTACATTGAAGTTTTGCATTTAACACAGGGGACATGCTGGGAGCAGATGTACACTCCAGGTGGGGAGGTGAGGAATGATGATGTTGATCAAAGCCTAATTATTGCTGCTAGGAACATAGTGAGAAGAGCTGCAGTATCAGCAGATCCACTAGCATCTTTATTAGAAATGTGCCATAGCACACAGATTGGTGGAACAAGGATGGTGGATATTCTCAGGCAAAATCCAACAGAAGAACAAGCTGTGGACATATGCAAAGCAGCAATGGGGCTGAGAATCAGTTCATCCTTCAGTTTTGGCGGATTCACATTTAAGAGAACAAGTGGATCATCAGTCAAAAGGGAGGAAGAAGTGCTCACGGGCAATCTGCAAACATTGAAACTAACTGTGCATGAGGGATATGAAGAGTTCACAATGGTTGGGAAAAGGGCAACAGCTATACTCAGAAAAGCAACCAGGAGATTGATCCAACTAATAGTGAGTGGAAGAGACGAACAATCAATAGTCGAAGCAATAGTTGTAGCAATGGTATTCTCACAAGAAGATTGCATGATAAAAGCAGTTAGAGGTGATCTGAATTTCGTTAATAGAGCGAATCAGCGGTTGAATCCCATGCATCAACTATTGAGACATTTTCAGAAGGATGCTAAAGTACTTTTCTTAAATTGGGGAGTTGAATCTATTGACAATGTGATGGGAATGATTGGGATATTACCTGATATGACTCCAAGTACCGAGATGTCAATGAGAGGAGTGAGAGTCAGCAAAATGGGTGTAGATGAATACTCCAATGCTGAAAGGGTAGTGGTAAGCATTGACCGTTTTTTGAGAGTCCGGGACCAAAGAGGAAATGTGCTACTGTCTCCAGAGGAAGTAAGTGAAACACAAGGGACAGAGAAACTGACAATAACTTATTCTTCATCAATGATGTGGGAGATTAATGGCCCTGAGTCAGTCTTGATCAATACCTATCAGTGGATCATCAGAAACTGGGAGACTGTTAAAATTCAGTGGTCTCAGAATCCTACGATGCTGTACAATAAAATGGAATTTGAACCATTTCAGTCTCTAGTCCCCAAGGCCATTAGAGGCCAATACAGTGGGTTTGTTAGAACTCTATTCCAACAAATGAGGGATGTGCTTGGGACTTTTGACACAACTCAGATAATAAAACTTCTTCCCTTTGCAGCCGCTCCTCCAAAGCAAAGCAGAATGCAATTCTCGTCATTAACTGTGAATGTGAGGGGATCAGGAATGAGAATACTTGTGAGGGGTAATTCTCCAGTATTCAACTACAACAAGACTACCAAGAGACTCACAGTCCTCGGAAAGGATGCTGGCACTTTAACTGAAGACCCAGATGAAGGCACAGCTGGAGTGGAATCTGCGGTTCTAAGGGGGTTCCTCATTTTAGGCAAAGAAGATAGAAGATATGGGCCAGCATTAAGCATCAATGAATTGAGCAACCTTGCGAAAGGGGAAAAAGCTAATGTGCTAATTGGGCAAGGGGATGTAGTGTTGGTAATGAAACGAAAACGGGACTCTAGCATACTTACTGACAGCCAGACAGCGACCAAAAGAATTCGGATGGCCATCAATTAA'),
('A_California_04_09_HA', 'Virus', 'A_California_04_09', 'RNA', 'Influenza A', 'ATGAAGGCAATACTAGTAGTTCTGCTATATACATTTGCAACCGCAAATGCAGACACATTATGTATAGGTTATCATGCGAACAATTCAACAGACACTGTAGACACAGTACTAGAAAAGAATGTAACAGTAACACACTCTGTTAACCTTCTAGAAGACAAGCATAACGGGAAACTATGCAAACTAAGAGGGGTAGCCCCATTGCATTTGGGTAAATGTAACATTGCTGGCTGGATCCTGGGAAATCCAGAGTGTGAATCACTCTCCACAGCAAGCTCATGGTCCTACATTGTGGAAACACCTAGTTCAGACAATGGAACGTGTTACCCAGGAGATTTCATCGATTATGAGGAGCTAAGAGAGCAATTGAGCTCAGTGTCATCATTTGAAAGGTTTGAGATATTCCCCAAGACAAGTTCATGGCCCAATCATGACTCGAACAAAGGTGTAACGGCAGCATGTCCTCATGCTGGAGCAAAAAGCTTCTACAAAAATTTAATATGGCTAGTTAAAAAAGGAAATTCATACCCAAAGCTCAGCAAATCCTACATTAATGATAAAGGGAAAGAAGTCCTCGTGCTATGGGGCATTCACCATCCATCTACTAGTGCTGACCAACAAAGTCTCTATCAGAATGCAGATACATATGTTTTTGTGGGGTCATCAAGATACAGCAAGAAGTTCAAGCCGGAAATAGCAATAAGACCCAAAGTGAGGGATCAAGAAGGGAGAATGAACTATTACTGGACACTAGTAGAGCCGGGAGACAAAATAACATTCGAAGCAACTGGAAATCTAGTGGTACCGAGATATGCATTCGCAATGGAAAGAAATGCTGGATCTGGTATTATCATTTCAGATACACCAGTCCACGATTGCAATACAACTTGTCAAACACCCAAGGGTGCTATAAACACCAGCCTCCCATTTCAGAATATACATCCGATCACAATTGGAAAATGTCCAAAATATGTAAAAAGCACAAAATTGAGACTGGCCACAGGATTGAGGAATATCCCGTCTATTCAATCTAGAGGCCTATTTGGGGCCATTGCCGGTTTCATTGAAGGGGGGTGGACAGGGATGGTAGATGGATGGTACGGTTATCACCATCAAAATGAGCAGGGGTCAGGATATGCAGCCGACCTGAAGAGCACACAGAATGCCATTGACGAGATTACTAACAAAGTAAATTCTGTTATTGAAAAGATGAATACACAGTTCACAGCAGTAGGTAAAGAGTTCAACCACCTGGAAAAAAGAATAGAGAATTTAAATAAAAAAGTTGATGATGGTTTCCTGGACATTTGGACTTACAATGCCGAACTGTTGGTTCTATTGGAAAATGAAAGAACTTTGGACTACCACGATTCAAATGTGAAGAACTTATATGAAAAGGTAAGAAGCCAGCTAAAAAACAATGCCAAGGAAATTGGAAACGGCTGCTTTGAATTTTACCACAAATGCGATAACACGTGCATGGAAAGTGTCAAAAATGGGACTTATGACTACCCAAAATACTCAGAGGAAGCAAAATTAAACAGAGAAGAAATAGATGGGGTAAAGCTGGAATCAACAAGGATTTACCAGATTTTGGCGATCTATTCAACTGTCGCCAGTTCATTGGTACTGGTAGTCTCCCTGGGGGCAATCAGTTTCTGGATGTGCTCTAATGGGTCTCTACAGTGTAGAATATGTATTTAA'),
('A_California_04_09_M', 'Virus', 'A_California_04_09', 'RNA', 'Influenza A', 'ATGAGTCTTCTAACCGAGGTCGAAACGTACGTTCTTTCTATCATCCCGTCAGGCCCCCTCAAAGCCGAGATCGCGCAGAGACTGGAAAGTGTCTTTGCAGGAAAGAACACAGATCTTGAGGCTCTCATGGAATGGCTAAAGACAAGACCAATCTTGTCACCTCTGACTAAGGGAATTTTAGGATTTGTGTTCACGCTCACCGTGCCCAGTGAGCGAGGACTGCAGCGTAGACGCTTTGTCCAAAATGCCCTAAATGGGAATGGGGACCCGAACAACATGGATAGAGCAGTTAAACTATACAAGAAGCTCAAAAGAGAAATAACGTTCCATGGGGCCAAGGAGGTGTCACTAAGCTATTCAACTGGTGCACTTGCCAGTTGCATGGGCCTCATATACAACAGGATGGGAACAGTGACCACAGAAGCTGCTTTTGGTCTAGTGTGTGCCACTTGTGAACAGATTGCTGATTCACAGCATCGGTCTCACAGACAGATGGCTACTACCACCAATCCACTAATCAGGCATGAAAACAGAATGGTGCTGGCTAGCACTACGGCAAAGGCTATGGAACAGATGGCTGGATCGAGTGAACAGGCAGCGGAGGCCATGGAGGTTGCTAATCAGACTAGGCAGATGGTACATGCAATGAGAACTATTGGGACTCATCCTAGCTCCAGTGCTGGTCTGAAAGATGACCTTCTTGAAAATTTGCAGGCCTACCAGAAGCGAATGGGAGTGCAGATGCAGCGATTCAAGTGATCCTCTCGTCATTGCAGCAAATATCATTGGGATCTTGCACCTGATATTGTGGATTACTGATCGTCTTTTTTTCAAATGTATTTATCGTCGCTTTAAATACGGTTTGAAAAGAGGGCCTTCTACGGAAGGAGTGCCTGAGTCCATGAGGGAAGAATATCAACAGGAACAGCAGAGTGCTGTGGATGTTGACGATGGTCATTTTGTCAACATAGAGCTAGAGTAA'),
('A_California_04_09_NA', 'Virus', 'A_California_04_09', 'RNA', 'Influenza A', 'ATGAATCCAAACCAAAAGATAATAACCATTGGTTCGGTCTGTATGACAATTGGAATGGCTAACTTAATATTACAAATTGGAAACATAATCTCAATATGGATTAGCCACTCAATTCAACTTGGGAATCAAAATCAGATTGAAACATGCAATCAAAGCGTCATTACTTATGAAAACAACACTTGGGTAAATCAGACATATGTTAACATCAGCAACACCAACTTTGCTGCTGGACAGTCAGTGGTTTCCGTGAAATTAGCGGGCAATTCCTCTCTCTGCCCTGTTAGTGGATGGGCTATATACAGTAAAGACAACAGTGTAAGAATCGGTTCCAAGGGGGATGTGTTTGTCATAAGGGAACCATTCATATCATGCTCCCCCTTGGAATGCAGAACCTTCTTCTTGACTCAAGGGGCCTTGCTAAATGACAAACATTCCAATGGAACCATTAAAGACAGGAGCCCATATCGAACCCTAATGAGCTGTCCTATTGGTGAAGTTCCCTCTCCATACAACTCAAGATTTGAGTCAGTCGCTTGGTCAGCAAGTGCTTGTCATGATGGCATCAATTGGCTAACAATTGGAATTTCTGGCCCAGACAATGGGGCAGTGGCTGTGTTAAAGTACAACGGCATAATAACAGACACTATCAAGAGTTGGAGAAACAATATATTGAGAACACAAGAGTCTGAATGTGCATGTGTAAATGGTTCTTGCTTTACTGTAATGACCGATGGACCAAGTAATGGACAGGCCTCATACAAGATCTTCAGAATAGAAAAGGGAAAGATAGTCAAATCAGTCGAAATGAATGCCCCTAATTATCACTATGAGGAATGCTCCTGTTATCCTGATTCTAGTGAAATCACATGTGTGTGCAGGGATAACTGGCATGGCTCGAATCGACCGTGGGTGTCTTTCAACCAGAATCTGGAATATCAGATAGGATACATATGCAGTGGGATTTTCGGAGACAATCCACGCCCTAATGATAAGACAGGCAGTTGTGGTCCAGTATCGTCTAATGGAGCAAATGGAGTAAAAGGGTTTTCATTCAAATACGGCAATGGTGTTTGGATAGGGAGAACTAAAAGCATTAGTTCAAGAAACGGTTTTGAGATGATTTGGGATCCGAACGGATGGACTGGGACAGACAATAACTTCTCAATAAAGCAAGATATCGTAGGAATAAATGAGTGGTCAGGATATAGCGGGAGTTTTGTTCAGCATCCAGAACTAACAGGGCTGGATTGTATAAGACCTTGCTTCTGGGTTGAACTAATCAGAGGGCGACCCAAAGAGAACACAATCTGGACTAGCGGGAGCAGCATATCCTTTTGTGGTGTAAACAGTGACACTGTGGGTTGGTCTTGGCCAGACGGTGCTGAGTTGCCATTTACCATTGACAAGTAA'),
('A_California_04_09_NP', 'Virus', 'A_California_04_09', 'RNA', 'Influenza A', 'ATGGCGTCTCAAGGCACCAAACGATCATATGAACAAATGGAGACTGGTGGGGAGCGCCAGGATGCCACAGAAATCAGAGCATCTGTCGGAAGAATGATTGGTGGAATCGGGAGATTCTACATCCAAATGTGCACTGAACTCAAACTCAGTGATTATGATGGACGACTAATCCAGAATAGCATAACAATAGAGAGGATGGTGCTTTCTGCTTTTGATGAGAGAAGAAATAAATACCTAGAAGAGCATCCCAGTGCTGGGAAGGACCCTAAGAAAACAGGAGGACCCATATATAGAAGAGTAGACGGAAAGTGGATGAGAGAACTCATCCTTTATGACAAAGAAGAAATAAGGAGAGTTTGGCGCCAAGCAAACAATGGCGAAGATGCAACAGCAGGTCTTACTCATATCATGATTTGGCATTCCAACCTGAATGATGCCACATATCAGAGAACAAGAGCGCTTGTTCGCACCGGAATGGATCCCAGAATGTGCTCTCTAATGCAAGGTTCAACACTTCCCAGAAGGTCTGGTGCCGCAGGTGCTGCGGTGAAAGGAGTTGGAACAATAGCAATGGAGTTAATCAGAATGATCAAACGTGGAATCAATGACCGAAATTTCTGGAGGGGTGAAAATGGACGAAGGACAAGGGTTGCTTATGAAAGAATGTGCAATATCCTCAAAGGAAAATTTCAAACAGCTGCCCAGAGGGCAATGATGGATCAAGTAAGAGAAAGTCGAAACCCAGGAAACGCTGAGATTGAAGACCTCATTTTCCTGGCACGGTCAGCACTCATTCTGAGGGGATCAGTTGCACATAAATCCTGCCTGCCTGCTTGTGTGTATGGGCTTGCAGTAGCAAGTGGGCATGACTTTGAAAGGGAAGGGTACTCACTGGTCGGGATAGACCCATTCAAATTACTCCAAAACAGCCAAGTGGTCAGCCTGATGAGACCAAATGAAAACCCAGCTCACAAGAGTCAATTGGTGTGGATGGCATGCCACTCTGCTGCATTTGAAGATTTAAGAGTATCAAGTTTCATAAGAGGAAAGAAAGTGATTCCAAGAGGAAAGCTTTCCACAAGAGGGGTCCAGATTGCTTCAAATGAGAATGTGGAAACCATGGACTCCAATACCCTGGAACTGAGAAGCAGATACTGGGCCATAAGGACCAGGAGTGGAGGAAATACCAATCAACAAAAGGCATCCGCAGGCCAGATCAGTGTGCAGCCTACATTCTCAGTGCAGCGGAATCTCCCTTTTGAAAGAGCAACCGTTATGGCAGCATTCAGCGGGAACAATGAAGGACGGACATCCGACATGCGAACAGAAGTTATAAGAATGATGGAAAGTGCAAAGCCAGAAGATTTGTCCTTCCAGGGGCGGGGAGTCTTCGAGCTCTCGGACGAAAAGGCAACGAACCCGATCGTGCCTTCCTTTGACATGAGTAATGAAGGGTCTTATTTCTTCGGAGACAATGCAGAGGAGTATGACAGTTGA'),
('A_California_04_09_NS', 'Virus', 'A_California_04_09', 'RNA', 'Influenza A', 'ATGGACTCCAACACCATGTCAAGCTTTCAGGTAGACTGTTTCCTTTGGCATATCCGCAAGCGATTTGCAGACAATGGATTGGGTGATGCCCCATTCCTTGATCGGCTCCGCCGAGATCAAAAGTCCTTAAAAGGAAGAGGCAACACCCTTGGCCTCGATATCGAAACAGCCACTCTTGTTGGGAAACAAATCGTGGAATGGATCTTGAAAGAGGAATCCAGCGAGACACTTAGAATGACAATTGCATCTGTACCTACTTCGCGCTACCTTTCTGACATGACCCTCGAGGAAATGTCACGAGACTGGTTCATGCTCATGCCTAGGCAAAAGATAATAGGCCCTCTTTGCGTGCGATTGGACCAGGCGATCATGGAAAAGAACATAGTACTGAAAGCGAACTTCAGTGTAATCTTTAACCGATTAGAGACCTTGATACTACTAAGGGCTTTCACTGAGGAGGGAGCAATAGTTGGAGAAATTTCACCATTACCTTCTCTTCCAGGACATACTTATGAGGATGTCAAAAATGCAGTTGGGGTCCTCATCGGAGGACTTGAATGGAATGGTAACACGGTTCGAGTCTCTGAAAATATACAGAGATTCGCTTGGAGAAACTGTGATGAGAATGGGAGACCTTCACTACCTCCAGAGCAGAAATGAAAAGTGGCGAGAGCAATTGGGACAGAAATTTGAGGAAATAAGGTGGTTAATTGAAGAAATGCGGCACAGATTGAAAGCGACAGAGAATAGTTTCGAACAAATAACATTTATGCAAGCCTTACAACTACTGCTTGAAGTAGAACAAGAGATAAGAGCTTTCTCGTTTCAGCTTATTTAA'),
('A_California_04_09_PA', 'Virus', 'A_California_04_09', 'RNA', 'Influenza A', 'ATGGAAGACTTTGTGCGACAATGCTTCAATCCAATGATCGTCGAGCTTGCGGAAAAGGCAATGAAAGAATATGGGGAAGATCCGAAAATCGAAACTAACAAGTTTGCTGCAATATGCACACATTTGGAAGTTTGTTTCATGTATTCGGATTTCCATTTCATCGACGAACGGGGTGAATCAATAATTGTAGAATCTGGTGACCCGAATGCACTATTGAAGCACCGATTTGAGATAATTGAAGGAAGAGACCGAATCATGGCCTGGACAGTGGTGAACAGTATATGTAACACAACAGGGGTAGAGAAGCCTAAATTTCTTCCTGATTTGTATGATTACAAAGAGAACCGGTTCATTGAAATTGGAGTAACACGGAGGGAAGTCCACATATATTACCTAGAGAAAGCCAACAAAATAAAATCTGAGAAGACACACATTCACATCTTTTCATTCACTGGAGAGGAGATGGCCACCAAAGCGGACTACACCCTTGACGAAGAGAGCAGGGCAAGAATCAAAACTAGGCTTTTCACTATAAGACAAGAAATGGCCAGTAGGAGTCTATGGGATTCCTTTCGTCAGTCCGAAAGAGGCGAAGAGACAATTGAAGAAAAATTTGAGATTACAGGAACTATGCGCAAGCTTGCCGACCAAAGTCTCCCACCGAACTTCCCCAGCCTTGAAAACTTTAGAGCCTATGTAGATGGATTCGAGCCGAACGGCTGCATTGAGGGCAAGCTTTCCCAAATGTCAAAAGAAGTGAACGCCAAAATTGAACCATTCTTGAGGACGACACCACGCCCCCTCAGATTGCCTGATGGGCCTCTTTGCCATCAGCGGTCAAAGTTCCTGCTGATGGATGCTCTGAAATTAAGTATTGAAGACCCGAGTCACGAGGGGGAGGGAATACCACTATATGATGCAATCAAATGCATGAAGACATTCTTTGGCTGGAAAGAGCCTAACATAGTCAAACCACATGAGAAAGGCATAAATCCCAATTACCTCATGGCTTGGAAGCAGGTGCTAGCAGAGCTACAGGACATTGAAAATGAAGAGAAGATCCCAAGGACAAAGAACATGAAGAGAACAAGCCAATTGAAGTGGGCACTCGGTGAAAATATGGCACCAGAAAAAGTAGACTTTGATGACTGCAAAGATGTTGGAGACCTTAAACAGTATGACAGTGATGAGCCAGAGCCCAGATCTCTAGCAAGCTGGGTCCAAAATGAATTCAATAAGGCATGTGAATTGACTGATTCAAGCTGGATAGAACTTGATGAAATAGGAGAAGATGTTGCCCCGATTGAACATATCGCAAGCATGAGGAGGAACTATTTTACAGCAGAAGTGTCCCACTGCAGGGCTACTGAATACATAATGAAGGGAGTGTACATAAATACGGCCTTGCTCAATGCATCCTGTGCAGCCATGGATGACTTTCAGCTGATCCCAATGATAAGCAAATGTAGGACCAAAGAAGGAAGACGGAAAACAAACCTGTATGGGTTCATTATAAAAGGAAGGTCTCATTTGAGAAATGATACTGATGTGGTGAACTTTGTAAGTATGGAGTTCTCACTCACTGACCCGAGACTGGAGCCACACAAATGGGAAAAATACTGTGTTCTTGAAATAGGAGACATGCTCTTGAGGACTGCGATAGGCCAAGTGTCGAGGCCCATGTTCCTATATGTGAGAACCAATGGAACCTCCAAGATCAAGATGAAATGGGGCATGGAAATGAGGCGCTGCCTTCTTCAGTCTCTTCAGCAGATTGAGAGCATGATTGAGGCCGAGTCTTCTGTCAAAGAGAAAGACATGACCAAGGAATTCTTTGAAAACAAATCGGAAACATGGCCAATCGGAGAGTCACCCAGGGGAGTGGAGGAAGGCTCTATTGGGAAAGTGTGCAGGACCTTACTGGCAAAATCTGTATTCAACAGTCTATATGCGTCTCCACAACTTGAGGGGTTTTCGGCTGAATCTAGAAAATTGCTTCTCATTGTTCAGGCACTTAGGGACAACCTGGAACCTGGAACCTTCGATCTTGGGGGGCTATATGAAGCAATCGAGGAGTGCCTGATTAATGATCCCTGGGTTTTGCTTAATGCATCTTGGTTCAACTCCTTCCTCACACATGCACTGAAGTAG'),
('A_California_04_09_PB1', 'Virus', 'A_California_04_09', 'RNA', 'Influenza A', 'ATGGATGTCAATCCGACTCTACTTTTCCTAAAAATTCCAGCGCAAAATGCCATAAGCACCACATTCCCTTATACTGGAGATCCTCCATACAGCCATGGAACAGGAACAGGATACACCATGGACACAGTAAACAGAACACACCAATACTCAGAAAAGGGAAAGTGGACGACAAACACAGAGACTGGTGCACCCCAGCTCAACCCGATTGATGGACCACTACCTGAGGATAATGAACCAAGTGGGTATGCACAAACAGACTGTGTTCTAGAGGCTATGGCTTTCCTTGAAGAATCCCACCCAGGAATATTTGAGAATTCATGCCTTGAAACAATGGAAGTTGTTCAACAAACAAGGGTAGATAAACTAACTCAAGGTCGCCAGACTTATGATTGGACATTAAACAGAAATCAACCGGCAGCAACTGCATTGGCCAACACCATAGAAGTCTTTAGATCGAATGGCCTAACAGCTAATGAGTCAGGAAGGCTAATAGATTTCTTAAAGGATGTAATGGAATCAATGAACAAAGAGGAAATAGAGATAACAACCCACTTTCAAAGAAAAAGGAGAGTAAGAGACAACATGACCAAGAAGATGGTCACGCAAAGAACAATAGGGAAGAAAAAACAAAGACTGAATAAGAGAGGCTATCTAATAAGAGCACTGACATTAAATACGATGACCAAAGATGCAGAGAGAGGCAAGTTAAAAAGAAGGGCTATCGCAACACCTGGGATGCAGATTAGAGGTTTCGTATACTTTGTTGAAACTTTAGCTAGGAGCATTTGCGAAAAGCTTGAACAGTCTGGGCTCCCAGTAGGGGGCAATGAAAAGAAGGCCAAACTGGCAAATGTTGTGAGAAAGATGATGACTAATTCACAAGACACAGAGATTTCTTTCACAATCACTGGGGACAACACTAAGTGGAATGAAAATCAAAATCCTCGAATGTTCCTGGCGATGATTACATATATCACCAGAAATCAACCCGAGTGGTTCAGAAACATCCTGAGCATGGCACCCATAATGTTCTCAAACAAAATGGCAAGACTAGGGAAAGGGTACATGTTCGAGAGTAAAAGAATGAAGATTCGAACACAAATACCAGCAGAAATGCTAGCAAGCATTGACCTGAAGTACTTCAATGAATCAACAAAGAAGAAAATTGAGAAAATAAGGCCTCTTCTAATAGATGGCACAGCATCACTGAGTCCTGGGATGATGATGGGCATGTTCAACATGCTAAGTACGGTCTTGGGAGTCTCGATACTGAATCTTGGACAAAAGAAATACACCAAGACAATATACTGGTGGGATGGGCTCCAATCATCCGACGATTTTGCTCTCATAGTGAATGCACCAAACCATGAGGGAATACAAGCAGGAGTGGACAGATTCTACAGGACCTGCAAGTTAGTGGGAATCAACATGAGCAAAAAGAAGTCCTATATAAATAAGACAGGGACATTTGAATTCACAAGCTTTTTTTATCGCTATGGATTTGTGGCTAATTTTAGCATGGAGCTACCCAGCTTTGGAGTGTCTGGAGTAAATGAATCAGCTGACATGAGTATTGGAGTAACAGTGATAAAGAACAACATGATAAACAATGACCTTGGACCTGCAACGGCCCAGATGGCTCTTCAATTGTTCATCAAAGACTACAGATACACATATAGGTGCCATAGGGGAGACACACAAATTCAGACGAGAAGATCATTTGAGTTAAAGAAGCTGTGGGATCAAACCCAATCAAAAGTAGGGCTATTAGTATCAGATGGAGGACCAAACTTATACAATATACGGAATCTTCACATTCCTGAAGTCTGCTTAAAATGGGAGCTAATGGATGATGATTATCGGGGAAGACTTTGTAATCCCCTGAATCCCTTTGTCAGTCATAAAGAGATTGATTCTGTAAACAATGCTGTGGTAATGCCAGCCCATGGTCCAGCCAAAAGCATGGAATATGATGCCGTTGCAACTACACATTCCTGGATTCCCAAGAGGAATCGTTCTATTCTCAACACAAGCCAAAGGGGAATTCTTGAGGATGAACAGATGTACCAGAAGTGCTGCAATCTATTCGAGAAATTTTTCCCTAGCAGTTCATATAGGAGACCGGTTGGAATTTCTAGCATGGTGGAGGCCATGGTGTCTAGGGCCCGGATTGATGCCAGGGTCGACTTCGAGTCTGGACGGATCAAGAAAGAAGAGTTCTCTGAGATCATGAAGATCTGTTCCACCATTGAAGAACTCAGACGGCAAAAATAA'),
('A_California_04_09_PB2', 'Virus', 'A_California_04_09', 'RNA', 'Influenza A', 'ATGGAGAGAATAAAAGAACTGAGAGATCTAATGTCGCAGTCCCGCACTCGCGAGATACTCACTAAGACCACTGTGGACCATATGGCCATAATCAAAAAGTACACATCAGGAAGGCAAGAGAAGAACCCCGCACTCAGAATGAAGTGGATGATGGCAATGAGATACCCAATTACAGCAGACAAGAGAATAATGGACATGATTCCAGAGAGGAATGAACAAGGACAAACCCTCTGGAGCAAAACAAACGATGCTGGATCAGACCGAGTGATGGTATCACCTCTGGCCGTAACATGGTGGAATAGGAATGGCCCAACAACAAGTACAGTTCATTACCCTAAGGTATATAAAACTTATTTCGAAAAGGTCGAAAGGTTGAAACATGGTACCTTCGGCCCTGTCCACTTCAGAAATCAAGTTAAAATAAGGAGGAGAGTTGATACAAACCCTGGCCATGCAGATCTCAGTGCCAAGGAGGCACAGGATGTGATTATGGAAGTTGTTTTCCCAAATGAAGTGGGGGCAAGAATACTGACATCAGAGTCACAGCTGGCAATAACAAAAGAGAAGAAAGAAGAGCTCCAGGATTGTAAAATTGCTCCCTTGATGGTGGCGTACATGCTAGAAAGAGAATTGGTCCGTAAAACAAGGTTTCTCCCAGTAGCCGGCGGAACAGGCAGTGTTTATATTGAAGTGTTGCACTTAACCCAAGGGACGTGCTGGGAGCAGATGTACACTCCAGGAGGAGAAGTGAGAAATGATGATGTTGACCAAAGTTTGATTATCGCTGCTAGAAACATAGTAAGAAGAGCAGCAGTGTCAGCAGACCCATTAGCATCTCTCTTGGAAATGTGCCACAGCACACAGATTGGAGGAGTAAGGATGGTGGACATCCTTAGACAGAATCCAACTGAGGAACAAGCCGTAGACATATGCAAGGCAGCAATAGGGTTGAGGATTAGCTCATCTTTCAGTTTTGGTGGGTTCACTTTCAAAAGGACAAGCGGATCATCAGTCAAGAAAGAAGAAGAAGTGCTAACGGGCAACCTCCAAACACTGAAAATAAGAGTACATGAAGGGTATGAAGAATTCACAATGGTTGGGAGAAGAGCAACAGCTATTCTCAGAAAGGCAACCAGGAGATTGATCCAGTTGATAGTAAGCGGGAGAGACGAGCAGTCAATTGCTGAGGCAATAATTGTGGCCATGGTATTCTCACAGGAGGATTGCATGATCAAGGCAGTTAGGGGCGATCTGAACTTTGTCAATAGGGCAAACCAGCGACTGAACCCCATGCACCAACTCTTGAGGCATTTCCAAAAAGATGCAAAAGTGCTTTTCCAGAACTGGGGAATTGAATCCATCGACAATGTGATGGGAATGATCGGAATACTGCCCGACATGACCCCAAGCACGGAGATGTCGCTGAGAGGGATAAGAGTCAGCAAAATGGGAGTAGATGAATACTCCAGCACGGAGAGAGTGGTAGTGAGTATTGACCGATTTTTAAGGGTTAGAGATCAAAGAGGGAACGTACTATTGTCTCCCGAAGAAGTCAGTGAAACGCAAGGAACTGAGAAGTTGACAATAACTTATTCGTCATCAATGATGTGGGAGATCAATGGCCCTGAGTCAGTGCTAGTCAACACTTATCAATGGATAATCAGGAACTGGGAAATTGTGAAAATTCAATGGTCACAAGATCCCACAATGTTATACAACAAAATGGAATTTGAACCATTTCAGTCTCTTGTCCCTAAGGCAACCAGAAGCCGGTACAGTGGATTCGTAAGGACACTGTTCCAGCAAATGCGGGATGTGCTTGGGACATTTGACACTGTCCAAATAATAAAACTTCTCCCCTTTGCTGCTGCCCCACCAGAACAGAGTAGGATGCAATTTTCCTCATTGACTGTGAATGTGAGAGGATCAGGGTTGAGGATACTGGTAAGAGGCAATTCTCCAGTATTCAATTACAACAAGGCAACCAAACGACTTACAGTTCTTGGAAAGGATGCAGGTGCATTGACTGAAGATCCAGATGAAGGCACATCTGGGGTGGAGTCTGCTGTCCTGAGAGGATTTCTCATTTTGGGCAAAGAAGACAAGAGATATGGCCCAGCATTAAGCATCAATGAACTGAGCAATCTTGCAAAAGGAGAGAAGGCTAATGTGCTAATTGGGCAAGGGGACGTAGTGTTGGTAATGAAACGAAAACGGGACTCTAGCATACTTACTGACAGCCAGACAGCGACCAAAAGAATTCGGATGGCCATCAATTAG'),
('SHIV-1157ipd3N4', 'Virus', 'SHIV-1157ipd3N4', 'RNA', 'SIV', 'CAGTCGCTCTGCGGAGAGGCTGGCAGATTGAGCCCTGGGAGGTTCTCTCCAGCACTAGCAGGTAGAGCCTGGGTGTTCCCTGCTAGACTCTCACCAGCACTTGGCCGGTGCTGGGCAGAGTGACTCCACGCTTGCTTGCTTAAAGCCCTCTTCAATAAAGCTGCCATTTTAGAAGTAAGCTAGTGTGTGTTCCCATCTCTCCTAGCCGCCGCCTGGTCAACTCGGTACTCAATAATAAGAAGACCCTGGTCTGTTAGGACCCTTTCTGCTTTGGGAAACCGAAGCAGGAAAATCCCTAGCAGATTGGCGCCTGAACAGGGACTTGAAGGAGAGTGAGAGACTCCTGAGTACGGCTGAGTGAAGGCAGTAAGGGCGGCAGGAACCAACCACGACGGAGTGCTCCTATAAAGGCGCGGGTCGGTACCAGACGGCGTGAGGAGCGGGAGAGGAAGAGGCCTCCGGTTGCAGGTAAGTGCAACACAAAAAAGAAATAGCTGTCTTTTATCCAGGAAGGGGTAATAAGATAGAGTGGGAGATGGGCGTGAGAAACTCCGTCTTGTCAGGGAAGAAAGCAGATGAATTAGAAAAAATTAGGCTACGACCCAACGGAAAGAAAAAGTACATGTTGAAGCATGTAGTATGGGCAGCAAATGAATTAGATAGATTTGGATTAGCAGAAAGCCTGTTGGAGAACAAAGAAGGATGTCAAAAAATACTTTCGGTCTTAGCTCCATTAGTGCCAACAGGCTCAGAAAATTTAAAAAGCCTTTATAATACTGTCTGCGTCATCTGGTGCATTCACGCAGAAGAGAAAGTGAAACACACTGAGGAAGCAAAACAGATAGTGCAGAGACACCTAGTGGTGGAAACAGGAACAACAGAAACTATGCCAAAAACAAGTAGACCAACAGCACCATCTAGCGGCAGAGGAGGAAATTACCCAGTACAACAAATAGGTGGTAACTATGTCCACCTGCCATTAAGCCCGAGAACATTAAATGCCTGGGTAAAATTGATAGAGGAAAAGAAATTTGGAGCAGAAGTAGTGCCAGGATTTCAGGCACTGTCAGAAGGTTGCACCCCCTATGACATTAATCAGATGTTAAATTGTGTGGGAGACCATCAAGCGGCTATGCAGATTATCAGAGATATTATAAACGAGGAGGCTGCAGATTGGGACTTGCAGCACCCACAACCAGCTCCACAACAAGGACAACTTAGGGAGCCGTCAGGATCAGATATTGCAGGAACAACTAGTTCAGTAGATGAACAAATCCAGTGGATGTACAGACAACAGAACCCCATACCAGTAGGCAACATTTACAGGAGATGGATCCAACTGGGGTTGCAAAAATGTGTCAGAATGTATAACCCAACAAACATTCTAGATGTAAAACAAGGGCCAAAAGAGCCATTTCAGAGCTATGTAGACAGGTTCTACAAAAGTTTAAGAGCAGAACAGACAGATGCAGCAGTAAAGAATTGGATGACTCAAACACTGCTGATTCAAAATGCTAACCCAGATTGCAAGCTAGTGCTGAAGGGGCTGGGTGTGAATCCCACCCTAGAAGAAATGCTGACGGCTTGTCAAGGAGTAGGGGGGCCGGGACAGAAGGCTAGATTAATGGCAGAAGCCCTGAAAGAGGCCCTCGCACCAGTGCCAATCCCTTTTGCAGCAGCCCAACAGAGGGGACCAAGAAAGCCAATTAAGTGTTGGAATTGTGGGAAAGAGGGACACTCTGCAAGGCAATGCAGAGCCCCAAGAAGACAGGGATGCTGGAAATGTGGAAAAATGGACCATGTTATGGCCAAATGCCCAGACAGACAGGCGGGTTTTTTAGGCCTTGGTCCATGGGGAAAGAAGCCCCGCAATTTCCCCATGGCTCAAGTGCATCAGGGGCTGATGCCAACTGCTCCCCCAGAGGACCCAGCTGTGGATCTGCTAAAGAACTACATGCAGTTGGGCAAGCAGCAGAGAGAAAAGCAGAGAGAAAGCAGAGAGAAGCCTTACAAGGAGGTGACAGAGGATTTGCTGCACCTCAATTCTCTCTTTGGAGGAGACCAGTAGTCACTGCTCATATTGAAGGACAGCCTGTAGAAGTATTACTGGATACAGGGGCTGATGATTCTATTGTAACAGGAATAGAGTTAGGTCCACATTATACCCCAAAAATAGTAGGAGGAATAGGAGGTTTTATTAATACTAAAGAATACAAAAATGTAGAAATAGAAGTTTTAGGCAAAAGGATTAAAGGGACAATCATGACAGGGGACACCCCGATTAACATTTTTGGTAGAAATTTGCTAACAGCTCTGGGGATGTCTCTAAATTTTCCCATAGCTAAAGTAGAGCCTGTAAAAGTCGCCTTAAAGCCAGGAAAGGATGGACCAAAATTGAAGCAGTGGCCATTATCAAAAGAAAAGATAGTTGCATTAAGAGAAATCTGTGAAAAGATGGAAAAGGATGGTCAGTTGGAGGAAGCTCCCCCGACCAATCCATACAACACCCCCACATTTGCTATAAAGAAAAAGGATAAGAACAAATGGAGAATGCTGATAGATTTTAGGGAACTAAATAGGGTCACTCAGGACTTTACGGAAGTCCAATTAGGAATACCACACCCTGCAGGACTAGCAAAAAGGAAAAGAATTACAGTACTGGATATAGGTGATGCATATTTCTCCATACCTCTAGATGAAGAATTTAGGCAGTACACTGCCTTTACTTTACCATCAGTAAATAATGCAGAGCCAGGAAAACGATACATTTATAAGGTTCTGCCTCAGGGATGGAAGGGGTCACCAGCCATCTTCCAATACACTATGAGACATGTGCTAGAACCCTTCAGGAAGGCAAATCCAGATGTGACCTTAGTCCAGTATATGGATGACATCTTAATAGCTAGTGACAGGACAGACCTGGAACATGACAGGGTAGTTTTACAGTCAAAGGAACTCTTGAATAGCATAGGGTTTTCTACCCCAGAAGAGAAATTCCAAAAAGATCCCCCATTTCAATGGATGGGGTACGAATTGTGGCCAACAAAATGGAAGTTGCAAAAGATAGAGTTGCCACAAAGAGAGACCTGGACAGTGAATGATATACAGAAGTTAGTAGGAGTATTAAATTGGGCAGCTCAAATTTATCCAGGTATAAAAACCAAACATCTCTGTAGGTTAATTAGAGGAAAAATGACTCTAACAGAGGAAGTTCAGTGGACTGAGATGGCAGAAGCAGAATATGAGGAAAATAAAATAATTCTCAGTCAGGAACAAGAAGGATGTTATTACCAAGAAGGCAAGCCATTAGAAGCCACGGTAATAAAGAGTCAGGACAATCAGTGGTCTTATAAAATTCACCAAGAAGACAAAATACTGAAAGTAGGAAAATTTGCAAAGATAAAGAATACACATACCAATGGAGTGAGACTATTAGCACATGTAATACAGAAAATAGGAAAGGAAGCAATAGTGATCTGGGGACAGGTCCCAAAATTCCACTTACCAGTTGAGAAGGATGTATGGGAACAGTGGTGGACAGACTATTGGCAGGTAACCTGGATACCGGAATGGGATTTTATCTCAACACCACCGCTAGTAAGATTAGTCTTCAATCTAGTGAAGGACCCTATAGAGGGAGAAGAAACCTATTATACAGATGGATCATGTAATAAACAGTCAAAAGAAGGGAAAGCAGGATATATCACAGATAGGGGCAAAGACAAAGTAAAAGTGTTAGAACAGACTACTAATCAACAAGCAGAATTGGAAGCATTTCTCATGGCATTGACAGACTCAGGGCCAAAGGCAAATATTATAGTAGATTCACAATATGTTATGGGAATAATAACAGGATGCCCTACAGAATCAGAGAGCAGGCTAGTTAATCAAATAATAGAAGAAATGATTAAAAAGTCAGAAATTTATGTAGCATGGGTACCAGCACACAAAGGTATAGGAGGAAACCAAGAAATAGACCACCTAGTTAGTCAAGGGATTAGACAAGTTCTCTTCTTGGAAAAGATAGAGCCAGCACAAGAAGAACATGATAAATACCATAGTAATGTAAAAGAATTGGTATTCAAATTTGGATTACCCAGAATAGTGGCCAGACAGATAGTAGACACCTGTGATAAATGTCATCAGAAAGGAGAGGCTATACATGGGCAGGCAAATTCAGATCTAGGGACTTGGCAAATGGATTGTACCCATCTAGAGGGAAAAATAATCATAGTTGCAGTACATGTAGCTAGTGGATTCATAGAAGCAGAGGTAATTCCACAAGAGACAGGAAGACAGACAGCACTATTTCTGTTAAAATTGGCAGGCAGATGGCCTATTACACATCTACACACAGATAATGGTGCTAACTTTGCTTCGCAAGAAGTAAAGATGGTTGCATGGTGGGCAGGGATAGAGCACACCTTTGGGGTACCATACAATCCACAGAGTCAGGGAGTAGTGGAAGCAATGAATCACCACCTGAAAAATCAAATAGATAGAATCAGGGAACAAGCAAATTCAGTAGAAACCATAGTATTAATGGCAGTTCATTGCATGAATTTTAAAAGAAGGGGAGGAATAGGGGATATGACTCCAGCAGAAAGATTAATTAACATGATCACTACAGAACAAGAGATACAATTTCAACAATCAAAAAACTCAAAATTTAAAAATTTTCGGGTCTATTACAGAGAAGGCAGAGATCAACTGTGGAAGGGACCCGGTGAGCTATTGTGGAAAGGGGAAGGAGCAGTCATCTTAAAGGTAGGGACAGACATTAAGGTAGTACCCAGAAGAAAGGCTAAAATTATCAAAGATTATGGAGGAGGAAAAGAGGTGGATAGCAGTTCCCACATGGAGGATACCGGAGAGGCTAGAGAGGTGGCATAGCCTCATAAAATATCTGAAATATAAAACTAAAGATCTACAAAAGGTTTGCTATGTGCCCCATTTTAAGGTCGGATGGGCATGGTGGACCTGCAGCAGAGTAATCTTCCCACTACAGGAAGGAAGCCATTTAGAAGTACAAGGGTATTGGCATTTGACACCAGAAAAAGGGTGGCTCAGTACTTATGCAGTGAGGATAACCTGGTACTCAAAGAACTTTTGGACAGATGTAACACCAAACTATGCAGACATTTTACTGCATAGCACTTATTTCCCTTGCTTTACAGCGGGAGAAGTGAGAAGGGCCATCAGGGGAGAACAACTGCTGTCTTGCTGCAGGTTCCCGAGAGCTCATAAGTACCAGGTACCAAGCCTACAGTACTTAGCACTGAAAGTAGTAAGCGATGTCAGATCCCAGGGAGAGAATCCCACCTGGAAACAGTGGAGAAGAGACAATAGGAGAGGCCTTCGAATGGCTAAACAGAACAGTAGAGGAGATAAACAGAGAGGCGGTAAACCACCTACCAAGGGAGCTAATTTTCCAGGTTTGGCAAAGGTCTTGGGAATACTGGCATGATGAACAAGGGATGTCACCAAGCTATGTAAAATACAGATACTTGTGTTTAATACAAAAGGCTTTATTTATGCATTGCAAGAAAGGCTGTAGATGTCTAGGGGAAGGACATGGGGCAGGGGGATGGAGACCAGGACCTCCTCCTCCTCCCCCTCCAGGACTAGCATAAATGGAAGAAAGACCTCCAGAAAATGAAGGACCACAAAGGGAACCATGGGATGAATGGGTAGTGGAGGTTCTGGAAGAACTGAAAGAAGAAGCTTTAAAACATTTTGATCCTCGCTTGCTAACTGCACTTGGTAATCATATCTATAATCGTCACGGAGACACTCTAGAGGGAGCAGGAGAACTCATTAGAATCCTCCAACGAGCGCTCTTCATGCATTTCAGAGGCGGATGCATCCACTCCAGAATCGGCCAACCTGGGGGAGGAAATCCTCTCTCAGCTATACCGCCCTCTAGAAGCATGCGCATGCTGTAGAGCAAGAAATGGAGCCAGTAGATCCTAGACTAGAGCCCTGGAAGCATCCAGGAAGCAGGCCTAAAACTGCTTGTACCAATTGCTATTGTAAAAAGTGTTGCTTTCATTGCCAAGTTTGTTTCATAACAAAAGCCCTAGGCATCTCCTATGGCAGGAAGAAGCGGAGACAGCGACGAAGAGCTCATCAGAACAGTCAGACTCATCAAGCTTCTCTATCAAAGCAGTAAGTAGTACATGTAATGCAATCTATACAAATAGAAATAGTAGCATTAGTAGTAGCAATAATAATAGCAATAGTTGTGTGGTCCATAGTAATCATAGAATATAGGAAAATATTAAGACAAAGAAAAATAGACAGGTTAATTAATAGACTAATAGAAAGAGCAGAAGACAGTGGCAATGAGAGTGAAGGAGAAATATCAGCACTTGTGGAGATGGGGGTGGAGATGGGGCATCATGCTCCTTGGGATGTTGATGATCTGTAGTGCTACAGAAAAATTGTGGGTCACAGTCTATTATGGGGTACCTGTATGGAAAGAAGCAAAAACTACTTTATTCTGTGCATCAAATGCTAAAGCATATGAGAAAGAAGTACATAACATCTGGGCTACACATGCCTGTGTACCCACAGACCCCAACCCACAAGAAATAGTTTTGGGAAATGTAACAGAAAATTTTAACATGTGGAAAAATGACATGGTGGATCAGATGCATGAGGATATAATCAGTTTATGGGATCAAAGCCTAAAGCCATGTGTAAAGTTGACTTCACTCTGTGTCACTTTAAAGTGTAGTAATTTTACCGGGAAGAGTAATGTTACCTACAAAGGGGATATGGAAGTAAAAAATTGCTCTTTCAATGTAACCACAGAAATAAGAGATAAGAAGCAGAAAGTGTATGCTCTTTTTTATAGACTTGATATAACACCACTTGATGACAACTCTAGTGAGTATATATTAATAAATTGCAATTCCTCAACCATAACACAAGCCTGTCCAAAGGTCAATTTTGACCCAATTCCTATACATTATTGTGCTCCAGCTGGTTATGCGATTCTAAAGTGTAATAATAAGACATTTAATGGGACAGGACCATGCCATAATGTCAGTACAGTACAATGTACACATGGAATTAAGCCAGTGGTATCAACTCAACTACTGTTAAACGGTAGCCTAGCAGAAGGGGAGATAATAATTAGATCTGAAAATCTGACAGACAATGTCAAAACAATAATAGTACACTTTAATGAATCTGTAGAAATTACTTGTACAAGACCCAACAATAATACAAGAAAAAGTATAAGCATAGGACCAGGACAAGCAATCTATGCCACAGGTGATATAATAGGAGACATAAGACAAGCACACTGTAACATTAGTAAAGAAAATTGGAACAAAACTTTACAATGGGTAAGGGGAAAATTAAAAGAACACTTCCCTAATAAAACAATAGTATTTAAACCATCCTCAGGAGGGGATCTAGAAATTACAACACATAGCTTTAATTGTAGAGGAGAATTTTTCTATTGCAACACATCAAAACTGTTTAATAGTACAGACAATAGTACACACATGGGTACAGAAAATAATACAATCATCACAATCCCATGTAGAATAAAACAAATTATAAACATGTGGCAGGAGGTAGGACGAGCAATGTATGCCCCCCCCATAGAAGGAAACATAACATGTAAATCAAATATCACAGGACTACTACTGGTACGTGATGGAGGATGGGACAACAGTACAAATGACACAGAAACATTCAGGCCTGGAGGAGGAGATATGAGGGACAATTGGAGAAGTGAATTATATAAATATAAGGTGGTAGAAGTCAAGCCATTGGGAATAGCACCCACTAAGGCAAAAAGGAGAGTGGTGGAGAGAGAAAAAAGAGCAGTGGGAATAGGAGCTGTGTTCCTTGGGTTCTTGGGAGCAGCAGGAAGCACTATGGGCGCGGCGTCAATAACGCTGACGGTACAGGCCAGACAACTGTTGTCTGGTATAGTGCAGCAGCAAGACAATTTGCTGAGAGCTATAGAGGCGCAACAACATATGTTGCAACTCACAGTCTGGGGCATTAAGCAGCTCCAGGCGAGAGTCCTGGCTATAGAAAGATACCTACAGGATCAACAGCTCCTAGGGATTTGGGGCTGCTCTGGAAAACTCATCTGCACCACTGCTGTGCCTTGGAACGACAGTTGGAGTAATAAATCTCAAACAGATATTTGGGAGAACATGACCTGGATGCAGTGGGATAGAGAAATTAGTAGACACACAGACACAATATACAGGTTGCTTGAAGACTCACAAAACCAGCAGGAGAAAAATGAAAAAGATTTATTAGCATTGGACAGTTGGAAAAATTTGTGGAATTGGTTTAGCATAACAAGGTGGCTGTGGTATATAAAAATATTCATAATGATAGTAGGAGGCCTGATAGGTTTGAGAATAATTTTTGCTGTGCTCTCGATAGTGAATAGAGTTAGGCAGGGATACTCACCATTATCGTTTCAGACCCACCTCCCACTTCCGAGGGGAGCCGACAGGCCCGAAGGAATAGAAGAAGAAGGTGGAGAGAGAGACAGAGACAGATCCATTCGATTAGTGACCGGATCCTTAGCACTTATCTGGGACGATCTGCGGAGCCTGTGCCTCTTCAGCTACCACCGCTTGAGAGACTTACTCTTGATTGTAACGAGGACTGTGGAACTCCTGGGACGCAGAGGGTGGGAAGCCCTCAAATATTGGTGGAATCTCCTACTGTATTGGAGTCAGGAACTAAAGAATAGTGCTGTTAGCTTGCTCAACGCCACAGCCATAGCAGTAAGACAATATGGGTGGAGCTATTTCCATGAGGCGGTCCAGGCCGTCTGGAGATCTGCGACAGAGACTCTTGCGGGCGCGTGGGGAGACTTATGGGAGATTCTTAGGAGAGGTGGAAGATGGATACTCGCAATCCCCAGGAGGATTAGACAAGGGCTCGAGCTCACTCTCTTGTGAGGGACAGAAATACAATCAGGGACAGCATATGAATACTCCATGGAGAAACCCAGCTGAAGAGGGAGAAAAATTAGCATACAGAAAACAAAATATGGATGATATAGATGAGGAAGATGATGACTTGGTAGGGGTATCAGTGAGGCCAAAAGTTCTCCTAAGAACAATGAGTTACAAATTGGCAATAGACATGTCTCATTTTATAAAAGAAAAGGGGGGACTGGAAGGGATTTATTACAGTGCAAGAAGACATAGAATCTTAGACATATACTTAGAAAAGGAAGAAGGCATCATACCAGATTGGCAGGATTACACCTCAGGACCAGGAATTAGATACCCAAAGACATTTGGCTGGCTATGGAAATTAGTCCCTGTAGATGTATCAGATGAGGCACAGGAGGATGAGGAGCATTACTTAATGCATCCAGCTCAAACTTCCCAGTGGGATGACCCTTGGGGAGAGGTTCTAGCATGGAAGTTTGATCCAACTCTGGCCTACACTTATGAGGCATATGTTAGATACCCAGAAGAGTTTGGAAGCAAGTCAGGCCTGTCAGAGGAAGAGGTTAGAAGAAGGCTAACCGCAAGAGGCCTTCTTAACATGGCTGACAAGAAGGAAACTCGCTGAAACAGCAGGGACTTTCCACAAAGGGACTTTCCACAAGGGGATGTTACGGGGAGGTACTGGGGAGGAGCCGGTCGGGAACGCCCACTTTCTTGATGTATAAATATCACTGCATTTCGCTCTGTATTCAGTCGCTCTGCGGAGAGGCTGGCAGATTGAGCCCTGGGAGGTTCTCTCCAGCACTAGCAGGTAGAGCCTGGGTGTTCCCTGCTAGACTCTCACCAGCACTTGGCCGGTGCTGGGCAGAGTGACTCCACGCTTGCTTACTTAAAGCCCTCTTCAATAAAGCTGCCATTTAGAAGTA')
;
-- ----------------------------
-- Table structure for sequenceAnalysis.ref_aa_sequences
-- ----------------------------
CREATE TABLE sequenceAnalysis.ref_aa_sequences
(
RowId serial NOT NULL,
Ref_nt_id INTEGER NOT NULL,
Name VARCHAR(255) NOT NULL,
Exons VARCHAR(255) DEFAULT NULL,
Start_location INTEGER DEFAULT NULL,
Sequence text NOT NULL,
Comments text DEFAULT NULL,
status BOOLEAN DEFAULT TRUE,
CreatedBy USERID,
Created TIMESTAMP,
ModifiedBy USERID,
Modified TIMESTAMP,
CONSTRAINT PK_ref_aa_sequences PRIMARY KEY (rowId),
CONSTRAINT UNIQUE_ref_aa_sequences UNIQUE (ref_nt_id, name),
CONSTRAINT fk_ref_aa_sequences_ref_nt_id FOREIGN KEY (ref_nt_id)
REFERENCES sequenceanalysis.ref_nt_sequences (rowid) MATCH SIMPLE
ON UPDATE NO ACTION ON DELETE NO ACTION
);
-- ----------------------------
-- Data for sequenceAnalysis.ref_aa_sequences
-- ----------------------------
INSERT INTO sequenceAnalysis.ref_aa_sequences
(exons, start_location, sequence, name, ref_nt_id) VALUES
('1309-2841', '1309', 'MGVRNSVLSGKKADELEKIRLRPNGKKKYMLKHVVWAANELDRFGLAESLLENKEGCQKILSVLAPLVPTGSENLKSLYNTVCVIWCIHAEEKVKHTEEAKQIVQRHLVVETGTTETMPKTSRPTAPSSGRGGNYPVQQIGGNYVHLPLSPRTLNAWVKLIEEKKFGAEVVPGFQALSEGCTPYDINQMLNCVGDHQAAMQIIRDIINEEAADWDLQHPQPAPQQGQLREPSGSDIAGTTSSVDEQIQWMYRQQNPIPVGNIYRRWIQLGLQKCVRMYNPTNILDVKQGPKEPFQSYVDRFYKSLRAEQTDAAVKNWMTQTLLIQNANPDCKLVLKGLGVNPTLEEMLTACQGVGGPGQKARLMAEALKEALAPVPIPFAAAQQRGPRKPIKCWNCGKEGHSARQCRAPRRQGCWKCGKMDHVMAKCPDRQAGFLGLGPWGKKPRNFPMAQVHQGLMPTAPPEDPAVDLLKNYMQLGKQQREKQRESREKPYKEVTEDLLHLNSLFGGDQ*', 'Gag', '1'),
('2484-5666', '2484', 'VLELWERGTLCKAMQSPKKTGMLEMWKNGPCYGQMPRQTGGFFRPWSMGKEAPQFPHGSSASGADANCSPRGPSCGSAKELHAVGQAAERKAERKQREALQGGDRGFAAPQFSLWRRPVVTAHIEGQPVEVLLDTGADDSIVTGIELGPHYTPKIVGGIGGFINTKEYKNVEIEVLGKRIKGTIMTGDTPINIFGRNLLTALGMSLNFPIAKVEPVKVALKPGKDGPKLKQWPLSKEKIVALREICEKMEKDGQLEEAPPTNPYNTPTFAIKKKDKNKWRMLIDFRELNRVTQDFTEVQLGIPHPAGLAKRKRITVLDIGDAYFSIPLDEEFRQYTAFTLPSVNNAEPGKRYIYKVLPQGWKGSPAIFQYTMRHVLEPFRKANPDVTLVQYMDDILIASDRTDLEHDRVVLQSKELLNSIGFSTPEEKFQKDPPFQWMGYELWPTKWKLQKIELPQRETWTVNDIQKLVGVLNWAAQIYPGIKTKHLCRLIRGKMTLTEEVQWTEMAEAEYEENKIILSQEQEGCYYQEGKPLEATVIKSQDNQWSYKIHQEDKILKVGKFAKIKNTHTNGVRLLAHVIQKIGKEAIVIWGQVPKFHLPVEKDVWEQWWTDYWQVTWIPEWDFISTPPLVRLVFNLVKDPIEGEETYYTDGSCNKQSKEGKAGYITDRGKDKVKVLEQTTNQQAELEAFLMALTDSGPKANIIVDSQYVMGIITGCPTESESRLVNQIIEEMIKKSEIYVAWVPAHKGIGGNQEIDHLVSQGIRQVLFLEKIEPAQEEHDKYHSNVKELVFKFGLPRIVARQIVDTCDKCHQKGEAIHGQANSDLGTWQMDCTHLEGKIIIVAVHVASGFIEAEVIPQETGRQTALFLLKLAGRWPITHLHTDNGANFASQEVKMVAWWAGIEHTFGVPYNPQSQGVVEAMNHHLKNQIDRIREQANSVETIVLMAVHCMNFKRRGGIGDMTPAERLINMITTEQEIQFQQSKNSKFKNFRVYYREGRDQLWKGPGELLWKGEGAVILKVGTDIKVVPRRKAKIIKDYGGGKEVDSSSHMEDTGEAREVA*', 'Pol', '1'),
('5596-6240', '5596', 'MEEEKRWIAVPTWRIPERLERWHSLIKYLKYKTKDLQKVCYVPHFKVGWAWWTCSRVIFPLQEGSHLEVQGYWHLTPEKGWLSTYAVRITWYSKNFWTDVTPNYADILLHSTYFPCFTAGEVRRAIRGEQLLSCCRFPRAHKYQVPSLQYLALKVVSDVRSQGENPTWKQWRRDNRRGLRMAKQNSRGDKQRGGKPPTKGANFPGLAKVLGILA*', 'Vif', '1'),
('6068-6406', '6068', 'MSDPRERIPPGNSGEETIGEAFEWLNRTVEEINREAVNHLPRELIFQVWQRSWEYWHDEQGMSPSYVKYRYLCLIQKALFMHCKKGCRCLGEGHGAGGWRPGPPPPPPPGLA*', 'vpX', '1'),
('6407-6712', '6407', 'MEERPPENEGPQREPWDEWVVEVLEELKEEALKHFDPRLLTALGNHIYNRHGDTLEGAGELIRILQRALFMHFRGGCIHSRIGQPGGGNPLSAIPPSRSML*', 'vpR', '1'),
('6558-6853;9062-9158', '6558', 'METPLREQENSLESSNERSSCISEADASTPESANLGEEILSQLYRPLEACYNTCYCKKCCYHCQFCFLKKGLGICYEQSRKRRRTPKKAKANTSSASNKPISNRTRHCQPEKAKKETVEKAVATAPGLGR*', 'Tat', '1'),
('6784-6853;9062-9315', '6784', 'MSNHEREEELRKRLRLIHLLHQTNPYPTGPGTANQRRQRKRRWRRRWQQLLALADRIYSFPDPPTDTPLDLAIQQLQNLAIESIPDPPTNTPEALCDPTEDSRSPQD*', 'Rev', '1'),
('6860-9499', '6860', 'MGCLGNQLLIAILLLSVYGIYCTLYVTVFYGVPAWRNATIPLFCATKNRDTWGTTQCLPDNGDYSEVALNVTESFDAWNNTVTEQAIEDVWQLFETSIKPCVKLSPLCITMRCNKSETDRWGLTKSITTTASTTSTTASAKVDMVNETSSCIAQDNCTGLEQEQMISCKFNMTGLKRDKKKEYNETWYSADLVCEQGNNTGNESRCYMNHCNTSVIQESCDKHYWDAIRFRYCAPPGYALLRCNDTNYSGFMPKCSKVVVSSCTRMMETQTSTWFGFNGTRAENRTYIYWHGRDNRTIISLNKYYNLTMKCRRPGNKTVLPVTIMSGLVFHSQPINDRPKQAWCWFGGKWKDAIKEVKQTIVKHPRYTGTNNTDKINLTAPGGGDPEVTFMWTNCRGEFLYCKMNWFLNWVEDRNTANQKPKEQHKRNYVPCHIRQIINTWHKVGKNVYLPPREGDLTCNSTVTSLIANIDWIDGNQTNITMSAEVAELYRLELGDYKLVEITPIGLAPTDVKRYTTGGTSRNKRGVFVLGFLGFLATAGSAMGAASLTLTAQSRTLLAGIVQQQQQLLDVVKRQQELLRLTVWGTKNLQTRVTAIEKYLKDQAQLNAWGCAFRQVCHTTVPWPNASLTPKWNNETWQEWERKVDFLEENITALLEEAQIQQEKNMYELQKLNSWDVFGNWFDLASWIKYIQYGVYIVVGVILLRIVIYIVQMLAKLRQGYRPVFSSPPSYFQQTHIQQDPALPTREGKERDGGEGGGNSSWPWQIEYIHFLIRQLIRLLTWLFSNCRTLLSRVYQILQPILQRLSATLQRIREVLRTELTYLQYGWSYFHEAVQAVWRSATETLAGAWGDLWETLRRGGRWILAIPRRIRQGLELTLL*', 'Env', '1'),
('9333-10124', '9333', 'MGGAISMRRSRPSGDLRQRLLRARGETYGRLLGEVEDGYSQSPGGLDKGLSSLSCEGQKYNQGQYMNTPWRNPAEEREKLAYRKQNMDDIDEEDDDLVGVSVRPKVPLRTMSYKLAIDMSHFIKEKGGLEGIYYSARRHRILDIYLEKEEGIIPDWQDYTSGPGIRYPKTFGWLWKLVPVNVSDEAQEDEEHYLMHPAQTSQWDDPWGEVLAWKFDPTLAYTYEAYVRYPEEFGSKSGLSEEEVRRRLTARGLLNMADKKETR*', 'Nef', '1'),
('1041-2561', '1054', 'MGARNSVLSGKKADELEKIRLRPGGKKKYMLKHVVWAANELDRFGLAESLLENKEGCQKILSVLAPLVPTGSENLKSLYNTVCVIWCIHAEEKVKHTEEAKQIVQRHLVVETGTAETMPKTSRPTAPSSGRGGNYPVQQIGGNYVHLPLSPRTLNAWVKLIEEKKFGAEVVPGFQALSEGCTPYDINQMLNCVGDHQAAMQIIRDIINEEAADWDLQHPQPAPQQGQLREPSGSDIAGTTSSVDEQIQWMYRQQNPIPVGNIYRRWIQLGLQKCVRMYNPTNILDVKQGPKEPFQSYVDRFYKSLRAEQTDAAVKNWMTQTLLIQNANPDCKLVLKGLGVNPTLEEMLTACQGVGGPGQKARLMAEALKEALAPVPIPFAAAQKRGPRKPIKCWNCGKEGHSARQCRAPRRQGCWKCGKMDHVMAKCPDRQAGFLGLGPWGKKPRNFPMAQVHQGLTPTAPPEDPAVDLLKNYMQLGKQQRESREKPYKEVTEDLLHLNSLFGGDQ*', 'Gag', '2'),
('218-1741', '218', 'MGARNSVLSGKKADELEKIRLRPNGKKKYMLKHXVWAANELDRFGLAESLLDNKEGCQKILSVLAPLVPTGSENLKSLYNTVCVIWCIHAEEKVKHTEEAKQIVQRHLVVETGTADKMPATSRPTAPPSGRGGNYPVQQXGGNYVHLPLSPRTLNAWVKLVEEKKFGAEVVPGFQALSEGCTPYDINQMLNCVGEHQAAMQIIREIINEEAADWDLQHPQPGPLPAGQLREPRGSDIAGTTSTVDEQIQWMYRQQNPIPVGNIYRRWIQLGLQKCVRMYNPTNILDVKQGPKEPFQSYVDRFYKSLRAEQTDPAVKNWMTQTLLIQNANPDCKLVLKGLGMNPTLEEMLTACQGIGGPGQKARLMAEALKEALRPDQLPFAAVQQKGQRRTIKCWNCGKEGHSARQCRAPRRQGCWXCGXTGHVMAKCPERQAGFLGLGPWGKKPRNFPMAQMPQGLIPTAPPEDPAVDLLKNYMKMGRKQRENRERPYKEVTEDLLHLNSLFGEDQ*', 'Gag', '4'),
('1507-4566', '1507', 'KTGGFFRAWPMGKEAPQFPHGPDASGADTNCSPRGSSCGSTEELHEDGQKAEGEQRETLQGGDRGFAAPQFSLWRRPVVTAYIEEQPVEVLLDTGADDSIVAGIELGPNYTPKVVGGIGGFINTKEYKDVKIKVLGKVIKGTIMTGDTPINIFGRNLLTAMGMSLNLPIAKVEPIKVTLKPGKEGPKLRQWPLSKEKIIALREICEKMEKDGQLEEAPPTNPYNTPTFAIKKKDKNKWRMLIDFRELNKVTQDFTEVQLGIPHPAGLAKRRRITVLDVGDAYFSIPLDEEFRQYTAFTLPSVNNAEPGKRYIYKVLPQGWKGSPAIFQYTMRNVLEPFRKANPDVTLIQYMDDILIASDRTDLEHDRVVLQLKELLNGIGFSTPEEKFQKDPPFQWMGYELWPTKWKLQKIELPQRETWTVNDIQKLVGVLNWAAQIYPGIKTKHLCRLIRGKMTLTEEVQWTEMAEAEYEENKIILSQEQEGCYYQEGKPIEATVIKSQDNQWSYKIHQEDKVLKVGKFAKVKNTHTNGVRLLAHVVQKIGKEALVIWGEVPKFHLPVEREIWEQWWTDYWQVTWIPDWDFVSTPPLVRLVFNLVKEPIQGAETFYVDGSCNRQSREGKAGYVTDRGRDKAKLLEQTTNQQAELEAFYLALXDSGPKANIIVDSQYVMGIIAGQPTESESRLVNQIIEEMIKKEAIYVAWVPAHKGIGGNQEVDHLVSQGIRQVLFLEKIEPAQEEHEKYHSNVKELVFKFGLPRLVAKQIVDTCDKCHQKGEAIHGQVNAELGTWQMDCTHLEGKIIIVAVHVASGFIEAEVIPQETGRQTALFLLKLAGRWPITHLHTDNGANFTSQEVKMVAWWAGIEQTFGVPYNPQSQGVVEAMNHHLKTQIDRIREQANSIETIVLMAVHCMNFKRRGGIGDMTPAERLVNMITTEQEIQFQQSKNSKFKNFRVYYREGRDQLWKGPGELLWKGEGAVILKVGTEIKVVPRRKAKIIKDYGGGKELDSGSHLEDTGEAREVA*', 'Pol', '4'),
('4496-5140', '4496', 'MEEEKNWIVVPTWRIPERLERWHSLIKHLKYNTKDLQMACYVPHHKVGWAWWTCSRVIFPLRDETHLEVQGYWNLAPEKGWLSTHAVRITWYSRNFWTDVTPDYADTLLHSTYFPCFSEGEVRRAIRGEKLLSCCKFPKAHKNQVPSLQYLALTVVSHVRSQGEDPTWKQWGRNNRRXLRMAKQNSRRNKQGSSKSPAEGANFPGLAKVLGILA*', 'Vif', '4'),
('4968-5306', '4968', 'MSDPRERIPPGNSGEETIEEAFEWLNRTVEGINRAAVNHLPRELIFQVWRRSWEYWHDXMGMSESYTKYRYLCLIQKALFVHCKKGCRCLGEXHGAGGWRTGPPPPPPPGLA*', 'vpX', '4'),
('5308-5613', '5308', 'MAERPPEDEAPQREPWDEWVVEVLEELKEEALKHFDPRLLTALGNYIYDRHGDTLEGAGELIRILQRALFIHFRSGCAHSRIGQSRGGNPLSTIPPSRDML*', 'vpR', '4'),
('5755-8418', '5755', 'MGCLGNQLLIALLLVSALEIYCVQYVTVFYGVPAWKNATIPLFCTTRNRDTWGTTQCLPDNDDYSELAIXITEAFDAWNNTVTEQAIEDVWNLFETSIKPCVKLTPLCIAMRCNKTETDRWGLTRNAGTTTTTTTTTTAATPSVAENVINESNPCIKNNSCAGLEQEPMIGCKFNMTGLKRDKRIEYNETWYSRDLICEQSANESESKCYMHHCNTSVIQESCDKHYWDAIRFRYCAPPGYALLRCNDSNYSGFAPNCSKVVVSSCTRMMETQTSTWFGFNGTRAENRTYIYWHGKSNRTIISLNKYYNLTMRCRRPGNKTVLPVTIMSGLVFHSQPINERPKQAWCWFGGSWKEAIQEVKETLVKHPRYTGTNDTKKINLTAPAGGDPEVTFMWTNCRGEFLYCKMNWFLNWVEDRDQKXSRWRQQNTRERQKKNYVPCHIRQIINTWHKVGKNVYLPPREGDLTCNSTVTSLIAEIDWTNNNETNITMSAEVAELYRLELGDYKLVEITPIGLAPTSVRRYTTTGASRNKRGVFVLGFLGFLATAGSAMGAASLTLSAQSRTLLAGIVQQQQQLLDVVKRQQELLRLTVWGTKNLQTRVTAIEKYLKDQAQLNSWGCAFRQVCHTTVPWPNETLVPNWSNMTWQEWERQVDFLEANITQLLEEAQIQQEKNMYELQKLNSWDIFGNWFDLTSWIRYIQYGVLIVLGVVGLRIVIYVVQMLARLRQGYRPVFSSPPAYVQQIPIHKGQEPPTKEGEEGEGGDRGGNRSWPWQIEYIHFLIRQLIRLLTWLFSSCRDWLLRXYQXLQPVLQSLSTTXQRVREVIRIGIAYLQYGWRYFQEAVQAWWKFARETLASAWRDIWETLGRVGRGILAIPRRXRQGXELXLL*', 'Env', '4'),
('5450-5748;7978-8077', '5450', 'MIDMETPLKEQENSLESCREHSSSISEVDVPTPESANLEEEILYQLYRPLETCYNKCYCKRCCYHCQHCFLKKGLGICYEQHRRRTPKKTKANPLPASNQIPIHKGQEPPTKEGEEGEGGDRGGNRSWPWQI*', 'Tat', '4'),
('5685-5748;7978-8219', '5685', 'MSSTEEELRKRLRLIHFLHQTTDPYPQGPGTANQRRRRRRRWRQRWQQILALADRIYSFPNPPTDTPLDLAIQQLQGLAIEDLPXPPTSXPEPLNDVAKSP*', 'Rev', '4'),
('8252-9043', '8252', 'MGGVISKKQCRRGGNLRERLLQARGETYGRLWEGLEEGYSQSXGASGKGLSSLSCEPQKYSEGQYMNTPWRNPAAERAKLGYRQQNMDDVDDEDDDLVXVSVHPRVPLRAMTYKLAIDMSHFIKEKGGLEGIYYNEKRHRILDMYMEKEEGIIPDWQNYTSGPGTRYPMYYGWLWKLVPVDVSDEAQEDETHCLMHPAQTHQWDDPWGEVLAWKFDPELAYSYKAFIKYPEEFGSKSXLSEEEVKRRLTARGLIKMADKKETS*', 'Nef', '4'),
('536-2068', '536', 'MGVRNSVLSGKKADELEKIRLRPNGKKKYMLKHVVWAANELDRFGLAESLLENKEGCQKILSVLAPLVPTGSENLKSLYNTVCVIWCIHAEEKVKHTEEAKQIVQRHLVVETGTTETMPKTSRPTAPSSGRGGNYPVQQIGGNYVHLPLSPRTLNAWVKLIEEKKFGAEVVPGFQALSEGCTPYDINQMLNCVGDHQAAMQIIRDIINEEAADWDLQHPQPAPQQGQLREPSGSDIAGTTSSVDEQIQWMYRQQNPIPVGNIYRRWIQLGLQKCVRMYNPTNILDVKQGPKEPFQSYVDRFYKSLRAEQTDAAVKNWMTQTLLIQNANPDCKLVLKGLGVNPTLEEMLTACQGVGGPGQKARLMAEALKEALAPVPIPFAAAQQRGPRKPIKCWNCGKEGHSARQCRAPRRQGCWKCGKMDHVMAKCPDRQAGFLGLGPWGKKPRNFPMAQVHQGLMPTAPPEDPAVDLLKNYMQLGKQQREKQRESREKPYKEVTEDLLHLNSLFGGDQ*', 'Gag', '3'),
('1714-4893', '1711', 'LELWERGTLCKAMQSPKKTGMLEMWKNGPCYGQMPRQTGGFFRPWSMGKEAPQFPHGSSASGADANCSPRGPSCGSAKELHAVGQAAERKAERKQREALQGGDRGFAAPQFSLWRRPVVTAHIEGQPVEVLLDTGADDSIVTGIELGPHYTPKIVGGIGGFINTKEYKNVEIEVLGKRIKGTIMTGDTPINIFGRNLLTALGMSLNFPIAKVEPVKVALKPGKDGPKLKQWPLSKEKIVALREICEKMEKDGQLEEAPPTNPYNTPTFAIKKKDKNKWRMLIDFRELNRVTQDFTEVQLGIPHPAGLAKRKRITVLDIGDAYFSIPLDEEFRQYTAFTLPSVNNAEPGKRYIYKVLPQGWKGSPAIFQYTMRHVLEPFRKANPDVTLVQYMDDILIASDRTDLEHDRVVLQSKELLNSIGFSTPEEKFQKDPPFQWMGYELWPTKWKLQKIELPQRETWTVNDIQKLVGVLNWAAQIYPGIKTKHLCRLIRGKMTLTEEVQWTEMAEAEYEENKIILSQEQEGCYYQEGKPLEATVIKSQDNQWSYKIHQEDKILKVGKFAKIKNTHTNGVRLLAHVIQKIGKEAIVIWGQVPKFHLPVEKDVWEQWWTDYWQVTWIPEWDFISTPPLVRLVFNLVKDPIEGEETYYTDGSCNKQSKEGKAGYITDRGKDKVKVLEQTTNQQAELEAFLMALTDSGPKANIIVDSQYVMGIITGCPTESESRLVNQIIEEMIKKSEIYVAWVPAHKGIGGNQEIDHLVSQGIRQVLFLEKIEPAQEEHDKYHSNVKELVFKFGLPRIVARQIVDTCDKCHQKGEAIHGQANSDLGTWQMDCTHLEGKIIIVAVHVASGFIEAEVIPQETGRQTALFLLKLAGRWPITHLHTDNGANFASQEVKMVAWWAGIEHTFGVPYNPQSQGVVEAMNHHLKNQIDRIREQANSVETIVLMAVHCMNFKRRGGIGDMTPAERLINMITTEQEIQFQQSKNSKFKNFRVYYREGRDQLWKGPGELLWKGEGAVILKVGTDIKVVPRRKAKIIKDYGGGKEVDSSSHMEDTGEAREVA*', 'Pol', '3'),
('4823-5467', '4823', 'MEEEKRWIAVPTWRIPERLERWHSLIKYLKYKTKDLQKVCYVPHFKVGWAWWTCSRVIFPLQEGSHLEVQGYWHLTPEKGWLSTYAVRITWYSKNFWTDVTPNYADILLHSTYFPCFTAGEVRRAIRGEQLLSCCRFPRAHKYQVPSLQYLALKVVSDVRSQGENPTWKQWRRDNRRGLRMAKQNSRGDKQRGGKPPTKGANFPGLAKVLGILA*', 'Vif', '3'),
('5295-5633', '5295', 'MSDPRERIPPGNSGEETIGEAFEWLNRTVEEINREAVNHLPRELIFQVWQRSWEYWHDEQGMSPSYVKYRYLCLIQKALFMHCKKGCRCLGEGHGAGGWRPGPPPPPPPGLA*', 'vpX', '3'),
('5634-5939', '5634', 'MEERPPENEGPQREPWDEWVVEVLEELKEEALKHFDPRLLTALGNHIYNRHGDTLEGAGELIRILQRALFMHFRGGCIHSRIGQPGGGNPLSAIPPSRSML*', 'vpR', '3'),
('5948-6162;8487-8580', '5948', 'MEPVDPRLEPWKHPGSKPKTACTNCYCKKCCFHCQVCFTTKALGISYGRKKRRQRRRAHQNSQTHQASLSKQPSSQPRGDPTGPKEQKKKVERETETDPVHQ*', 'Tat', '3'),
('6087-6162;8487-8761', '6087', 'MAGRSGDSDEELIRTVRLIKLLYQSNPPPSLEGTRQARRNRRRRWRERQRQIRSISERILGTYLGRSAEPVPLQLPPLERLTLDCNEDCGTSGTQGVGSPQILVESPTVLESGTKE*', 'Rev', '3'),
('6179-6424', '6179', 'MQPIQIAIVALVVAIIIAIVVWSIVIIEYRKILRQRKIDRLIDRLIERAEDSGNESEGEISALVEMGVEMGHHAPWDVDDL*', 'vpU', '3'),
('6339-8948', '6339', 'MRVKEKYQHLWRWGWRWGTMLLGMLMICSATEKLWVTVYYGVPVWREATTTLFCASDAKAYDTEVHNVWATHACVPTDPNPQEVVLGNVTENFNMWKNNMVDQMHEDIISLWDESLKPCVKLTPLCVTLNCTNLNITKNTTNLTSSSWGMMEEGEIKNCSFYITTSIRNKVKKEYALFNRLDVVPVKNTSNTKYRLISCNTSVITQACPKVSFQPIPIHYCVPAGFAILKCNNKTFNGSGPCTNVSTVQCTHGIRPVVSTQLLLNGSLAEEDIVIRSEDFTDNVKTIIVQLNESVVINCTRPNNNTRERLSIGPGRAFYARRNIIGDIRQAHCNISRAKWNNTLQQIVIKLREKFRNKTIAFNQSSGGDPEIVMHSFNCGGEFFYCNTAQLFNSTWNVAGGTNGTEGNDIITLQCRIKQIINMWQKVGKAMYAPPITGQIRCSSNITGLLLTRDGGNSTETETEIFRPGGGDMRDNWRSELYKYKVVRIEPIGVAPTRAKRRTVQREKRAVGIGAVFLGFLGAAGSTMGAASVTLTVQARLLLSGIVQQQNNLLRAIEAQQNMLRLTVWGIKQLQARVLALERYLRDQQLMGIWGCSGKLICTTSVPWNVSWSNKSVDDIWNNMTWMEWEREIDNYTDYIYDLLEKSQTQQEKNEKELLELDKWASLWNWFDITNWLWYIRLFIMIVGGLIGLRIVFAVLSIVNRVRQGYSPLSFQTLLPASRGPDRPEGTEEEGGERDRDRSGPSVNGSLALIWDDLRSLCLFSYHRLRDLLLIVTRIVELLGRRGWEALKYWWNLLQYWSQELKNSAVSLLQYGWSYFHEAVQAVWRSATETLAGAWGDLWETLRRGGRWILAIPRRIRQGLELTLL*', 'Env', '3'),
('8782-9573', '8782', 'MGGAISMRRSRPSGDLRQRLLRARGETYGRLLGEVEDGYSQSPGGLDKGLSSLSCEGQKYNQGQYMNTPWRNPAEEREKLAYRKQNMDDIDEEDDDLVGVSVRPKVPLRTMSYKLAIDMSHFIKEKGGLEGIYYSARRHRILDIYLEKEEGIIPDWQDYTSGPGIRYPKTFGWLWKLVPVNVSDEAQEDEEHYLMHPAQTSQWDDPWGEVLAWKFDPTLAYTYEAYVRYPEEFGSKSGLSEEEVRRRLTARGLLNMADKKETR*', 'Nef', '3'),
('2216-5386', '2229', 'VLELWEGGTLCKAMQSPKKTGMLEMWKNGPCYGQMPRQTGGFFRPWSMGKEAPQFPHGSSASGADANCSPRGPSCGSAKELHAVGQAAERKQREALQGGDRGFAAPQFSLWRRPVVTAHIEGQPVEVLLDTGADDSIVTGIELGPHYTPKIVGGIGGFINTKEYKNVKIEVLGKRIKGTIMTGDTPINIFGRNLLTALGMSLNLPIAKVEPVKVTLKPGKVGPKLKQWPLSKEKIVALREICEKMEKDGQLEEAPPTNPYNTPTFAIKKKDKNKWRMLIDFRELNRVTQDFTEVQLGIPHPAGLAKRKRITVLDIGDAYFSIPLDEEFRQYTAFTLPSVNNAEPGKRYIYKVLPQGWKGSPAIFQYTMRHVLEPFRKANPDVTLVQYMDDILIASDRTDLEHDRVVLQLKELLNSIGFSTPEEKFQKDPPFQWMGYELWPTKWKLQKIELPQRETWTVNDIQKLVGVLNWAAQIYPGIKTKHLCRLIRGKMTLTEEVQWTEMAEAEYEENKIILSQEQEGCYYQEGKPLEATVIKSQDNQWSYKIHQEDKILKVGKFAKIKNTHTNGVRLLAHVIQKIGKEAIVIWGQVPKFHLPVERDVWEQWWTDYWQVTWIPEWDFISTPPLVRLVFNLVKDPIEGEETYYTDGSCNKQSKEGKAGYITDRGKDKVKVLEQTTNQQAELEAFLMALTDSGPKTNIIVDSQYVMGIITGCPTESESRLVNQIIEEMIKKSEIYVAWVPAHKGIGGNQEIDHLVSQGIRQVLFLEKIEPAQEEHDKYHSNVKELVFKFGLPRIVARQIVDTCDKCHQKGEAIHGQVNSDLGTWQMDCTHLEGKIVIVAVHVASGFIEAEVIPQETGRQTALFLLKLAGRWPITHLHTDNGANFASQEVKMVAWWAGIEHTFGVPYNPQSQGVVEAMNHHLKNQIDRIREQANSVETIVLMAVHCMNFKRRGGIGDMTPAERLINMITTEQEIQFQQSKNSKFKNFRVYYREGRDQLWKGPGELLWKGEGAVILKVGTDIKVVPRRKAKIIKDYGGGKEVDSSSHMEDTGEAREVA*', 'Pol', '2'),
('5316-5960', '5316', 'MEEEKRWIAVPTWRIPERLERWHSLIKYLKYKTKDLQKVCYVPHFKVGWAWWTCSRVIFPLQEGSHLEVQGYWHLTPERGWLSTYAVRITWYSRNFWTDVTPDYADILLHSTYFPCFTAGEVRRAIRGEQLLSCCKFPRAHRYQVPSLQYLALKVVSDVRSQGENPTWKQWRRDNRRGLRMAKQNSRGDKQRGSKPPTKGADFPGLAKVLGILA*', 'Vif', '2'),
('5788-6126', '5801', 'MSDPRERIPPGNSGEETIGEAFEWLNRTVEEINREAVNHLPRELIFQVWQRSWEYWHDEQGMSQSYVKYRYLCLMQKALFMHCKKGCRCLGEGHGAGGWRPGPPPPPPPGLA*', 'vpX', '2'),
('6127-6420', '6140', 'MEERPPENEGPQREPWDEWVVEVLEELKEEALKHFDPRLLTALGNHIYNRHGDTLEGAGELIRILQRALFMHFRGGCNHSRIGQPGGGNPLSTIPPS*', 'vpR', '2'),
('6278-6573;8785-8884', '6291', 'METPLREQENSLESSNERSSCILEADATTPESANLGEEILSQLYRPLEACYNTCYCKKCCYHCQFCFLKKGLGICYEQSRKRRRTPKKAKANTSSASNNRLIPNRTRHCQPEKAKKETVEKAVATAPGLGR*', 'Tat', '2'),
('6504-6573;8785-9041', '6517', 'MSSHEREEELRKRLRLIHLLHQTIDSYPTGPGTANQRRQRRRRWRRRWQQLLALADRIYSFPDPPTDTPLDLAIQQLQNLAIESIPDPPTNTPEALCDPTKGSRSPQD*', 'Rev', '2'),
('9059-9802', '9072', 'MGGAISMRRSKPAGDLRQKLLRARGETYGRLLGEVEDGSSQSLGGLGKGLSSRSCEGQKYNQGQYMNTPWRNPAEEKEKLAYRKQNMDDIDEEDDDLVGVSVRPKVPLRAMTYKLAIDMSHFIKEKGGLEGIYYSARRHRILDMYLEKEEGIIPDWQDYTSGPGIRYPKTFGWLWKLVPVNVSDEAQEDERHYLMQPAQTSKWDDPWGEVLAWKFDPTLAYTYEAYARYPEELEASQACQRKRLEEG*', 'Nef', '2'),
('6580-9225', '6593', 'MGCLGNQLLIAILLLSVYGIYCTQYVTVFYGVPAWRNATIPLFCATKNRDTWGTTQCLPDNGDYSELALNVTESFDAWENTVTEQAIEDVWQLFETSIKPCVKLSPLCITMRCNKSETDRWGLTKSSTTITTAAPTSAPVSEKIDMVNETSSCIAQNNCTGLEQEQMISCKFTMTGLKRDKTKEYNETWYSTDLVCEQGNSTDNESRCYMNHCNTSVIQESCDKHYWDTIRFRYCAPPGYALLRCNDTNYSGFMPKCSKVVVSSCTRMMETQTSTWFGFNGTRAENRTYIYWHGRDNRTIISLNKYYNLTMKCRRPGNKTVLPVTIMSGLVFHSQPINDRPKQAWCWFGGKWKDAIKEVKQTIVKHPRYTGTNNTDKINLTAPGGGDPEVTFMWTNCRGEFLYCKMNWFLNWVEDRDVTTQRPKERHRRNYVPCHIRQIINTWHKVGKNVYLPPREGDLTCNSTVTSLIANIDWTDGNQTSITMSAEVAELYRLELGDYKLVEITPIGLAPTDVKRYTTGGTSRNKRGVFVLGFLGFLATAGSAMGAASLTLTAQSRTLLAGIVQQQQQLLDVVKRQQELLRLTVWGTKNLQTRVTAIEKYLKDQAQLNAWGCAFRQVCHTTVPWPNASLTPDWNNDTWQEWERKVDFLEENITALLEEAQIQQEKNMYELQKLNSWDVFGNWFDLASWIKYIQYGIYVVVGVILLRIVIYIVQMLAKLRQGYRPVFSSPPSYFQ*THTQQDPALPTREGKEGDGGEGGGNSSWPWQIEYIHFLIRQLIRLLTWLFSNCRTLLSRAYQILQPILQRLSATLRRVREVLRTELTYLQYGWSYFHEAVQAGWRSATETLAGAWRDLWETLRRGGRWILAIPRRIRQGLELTLL*', 'Env', '2'),
('336-1838', '336', 'MGARASVLSGGELDRWEKIRLRPGGKKKYKLKHIVWASRELERFAVNPGLLETSEGCRQILGQLQPSLQTGSEELRSLYNTVATLYCVHQRIEIKDTKEALDKIEEEQNKSKKKAQQAAADTGHSNQVSQNYPIVQNIQGQMVHQAISPRTLNAWVKVVEEKAFSPEVIPMFSALSEGATPQDLNTMLNTVGGHQAAMQMLKETINEEAAEWDRVHPVHAGPIAPGQMREPRGSDIAGTTSTLQEQIGWMTNNPPIPVGEIYKRWIILGLNKIVRMYSPTSILDIRQGPKEPFRDYVDRFYKTLRAEQASQEVKNWMTETLLVQNANPDCKTILKALGPAATLEEMMTACQGVGGPGHKARVLAEAMSQVTNSATIMMQRGNFRNQRKIVKCFNCGKEGHTARNCRAPRKKGCWKCGKEGHQMKDCTERQANFLGKIWPSYKGRPGNFLQSRPEPTAPPEESFRSGVETTTPPQKQEPIDKELYPLTSLRSLFGNDPSSQ*', 'Gag', '5'),
('5377-5591;7925-7970', '5377', 'MEPVDPRLEPWKHPGSQPKTACTNCYCKKCCFHCQVCFITKALGISYGRKKRRQRRRAHQNSQTHQASLSKQPTSQPRGDPTGPKE*', 'Tat', '5'),
('5516-5591;7925-8199', '5516', 'MAGRSGDSDEELIRTVRLIKLLYQSNPPPNPEGTRQARRNRRRRWRERQRQIHSISERILGTYLGRSAEPVPLQLPPLERLTLDCNEDCGTSGTQGVGSPQILVESPTVLESGTKE*', 'Rev', '5'),
('5608-5856', '5608', 'MQPIPIVAIVALVVAIIIAIVVWSIVIIEYRKILRQRKIDRLIDRLIERAEDSGNESEGEISALVEMGVEMGHHAPWDVDDL*', 'Vpu', '5'),
('5771-8341', '5771', 'MRVKEKYQHLWRWGWRWGTMLLGMLMICSATEKLWVTVYYGVPVWKEATTTLFCASDAKAYDTEVHNVWATHACVPTDPNPQEVVLVNVTENFNMWKNDMVEQMHEDIISLWDQSLKPCVKLTPLCVSLKCTDLKNDTNTNSSSGRMIMEKGEIKNCSFNISTSIRGKVQKEYAFFYKLDIIPIDNDTTSYKLTSCNTSVITQACPKVSFEPIPIHYCAPAGFAILKCNNKTFNGTGPCTNVSTVQCTHGIRPVVSTQLLLNGSLAEEEVVIRSVNFTDNAKTIIVQLNTSVEINCTRPNNNTRKRIRIQRGPGRAFVTIGKIGNMRQAHCNISRAKWNNTLKQIASKLREQFGNNKTIIFKQSSGGDPEIVTHSFNCGGEFFYCNSTQLFNSTWFNSTWSTEGSNNTEGSDTITLPCRIKQIINMWQKVGKAMYAPPISGQIRCSSNITGLLLTRDGGNSNNESEIFRPGGGDMRDNWRSELYKYKVVKIEPLGVAPTKAKRRVVQREKRAVGIGALFLGFLGAAGSTMGAASMTLTVQARQLLSGIVQQQNNLLRAIEAQQHLLQLTVWGIKQLQARILAVERYLKDQQLLGIWGCSGKLICTTAVPWNASWSNKSLEQIWNHTTWMEWDREINNYTSLIHSLIEESQNQQEKNEQELLELDKWASLWNWFNITNWLWYIKLFIMIVGGLVGLRIVFAVLSIVNRVRQGYSPLSFQTHLPTPRGPDRPEGIEEEGGERDRDRSIRLVNGSLALIWDDLRSLCLFSYHRLRDLLLIVTRIVELLGRRGWEALKYWWNLLQYWSQELKNSAVSLLNATAIAVAEGTDRVIEVVQGACRAIRHIPRRIRQGLERILL*', 'Env', '5'),
('8343-8963', '8343', 'MGGKWSKSSVIGWPTVRERMRRAEPAADRVGAASRDLEKHGAITSSNTAATNAACAWLEAQEEEEVGFPVTPQVPLRPMTYKAAVDLSHFLKEKGGLEGLIHSQRRQDILDLWIYHTQGYFPDWQNYTPGPGVRYPLTFGWCYKLVPVEPDKIEEANKGENTSLLHPVSLHGMDDPEREVLEWRFDSRLAFHHVARELHPEYFKNC*', 'Nef', '5'),
('4587-5165', '4587', 'MENRWQVMIVWQVDRMRIRTWKSLVKHHMYVSGKARGWFYRHHYESPHPRISSEVHIPLGDARLVITTYWGLHTGERDWHLGQGVSIEWRKKRYSTQVDPELADQLIHLYYFDCFSDSAIRKALLGHIVSPRCEYQAGHNKVGSLQYLALAALITPKKIKPPLPSVTKLTEDRWNKPQKTKGHRGSHTMNGH*', 'Vif', '5'),
('5105-5341', '5105', 'MEQAPEDQGPQREPHNEWTLELLEELKNEAVRHFPRIWLHGLGQHIYETYGDTWAGVEAIIRILQQLLFIHFQNWVST*', 'Vpr', '5'),
('1309-2841', '1309', 'MGARNSVLSGKKADELEKIRLRPGGKKKYMLKHVVWAANELDRFGLAESLLENKEGCQKILSVLAPLVPTGSENLKSLYNTVCVIWCIHAEEKVKHTEEAKQIVQRHLVVETGTAETMPKTSRPTAPSSGRGGNYPVQQIGGNYVHLPLSPRTLNAWVKLIEEKKFGAEVVPGFQALSEGCTPYDINQMLNCVGDHQAAMQIIRDIINEEAADWDLQHPQPAPQQGQLREPSGSDIAGTTSSVDEQIQWMYRQQNPIPVGNIYRRWIQLGLQKCVRMYNPTNILDVKQGPKEPFQSYVDRFYKSLRAEQTDAAVKNWMTQTLLIQNANPDCKLVLKGLGVNPTLEEMLTACQGVGGPGQKARLMAEALKEALAPVPIPFAAAQQRGPKKPIKCWNCGKEGHSARQCRAPRRQGCWKCGKMDHVMAKCPDRQAGFLGLGPWGKKPRNFPMAQVHQGLTPTAPPEDPAVDLLKNYMQLGKQQREKQRESREKPYKEVTEDLLHLNSLFGGDQ*', 'Gag', '6'),
('2484-5666', '2484', 'MLELWERRTLCKAMQSPKKTGMLEMWKNGPCYGQMPRQTGGFFRPWSMGKEAPQFPHGSSASGADANCSPRGPSCGSAKELHAVGQAAERKAERKQREALQGGDRGFAAPQFSLWRRPVVTAHIEGQPVEVLLDTGADDSIVTGIELGPHYTPKIVGGIGGFINTKEYKNVEIEVLGKRIKGTIMTGDTPINIFGRNLLTALGMSLNLPIAKVEPVKVALKPGKVGPKLKQWPLSKEKIVALREICEKMEKDGQLEEAPPTNPYNTPTFAIKKKDKNKWRMLIDFRELNRVTQDFTEVQLGIPHPAGLAKRKRITVLDIGDAYFSIPLDEEFRQYTAFTLPSVNNAEPGKRYIYKVLPQGWKGSPAIFQYTMRHVLEPFRKANPDVTLVQYMDDILIASDRTDLEHDRVVLQLKELLNSIGFSTPEEKFQKDPPFQWMGYELWPTKWKLQKIELPQRETWTVNDIQKLVGVLNWAAQIYPGIKTKHLCRLIRGKMTLTEEVQWTEMAEAEYEENKIILSQEQEGCYYQEGKPLEATVIKSQDNQWSYKMHQEDKILKVGKFAKIKNTHTNGVRLLAHVIQKIGKEAIVIWGQVPKFHLPVERDVWEQWWTDYWQVTWIPEWDFISTPPLVRLVFNLVKDPIEGEETYYTDGSCNKQSKEGKAGYITDRGKDKVKVLEQTTNQQAELEAFLMALTDSGPKANIIVDSQYVMGIITGCPTESESRLVNQIIEEMIKKSEIYVAWVPAHKGIGGNQEIDHLVSQGIRQVLFLEKIEPAQEEHDKYHSNVKELVFKFGLPRIVARQIVDTCDKCHQKGEAIHGQVNSDLGTWQMDCTHLEGKIVIVAVHVASGFIEAEVIPQETGRQTALFLLKLASRWPVTHLHTDNGANFASQEVKMVAWWAGIEHTFGVPYNPQSQGVVEAMNHHLKNQIDRIREQANSVETIVLMAVHCMNFKRRGGIGDMTPAERLINMITTEQEIQFQQSKNSKFKNFRVYYREGRDQLWKGPGELLWKGEGAVILKVGTDIKVVPRRKAKIIKDYGGGKEVDSSSHMEDTGEAREVA*', 'Pol', '6'),
('5596-6240', '5596', 'MEEEKRWIAVPTWRIPERLERWHSLIKYLKYKTKDLQKVCYVPHYKVGWAWWTCSRVIFPLQEGSHLEVQGYWHLTPERGWLSTYAVRITWYSRNFWTDVTPDYADILLHSTYFPCFTAGEVRRAIRGEQLLSCCRFPRAHKNQVPSLQYLALRVVSDVRSQGENPTWKQWRRDNRRGLRMAKQNSRGDKQRGGKPPTKGANFPGLAKVLGILA*', 'Vif', '6'),
('6068-6406', '6068', 'MSDPRERIPPGNSGEETIGEAFEWLNRTVEEINREAVNHLPRELIFQVWQRSWEYWHDEQGMSPSYVKYRYLCLIQKALFMHCKKGCRCLGEGHGAGGWRPGPPPPPPPGLA*', 'vpX', '6'),
('6407-6700', '6407', 'MEERPPENEGPQREPWDEWVVEVLEELKEEALKHFDPRLLTALGNHIYNRHGDTLEGAGELIRILQRALFMHFRGGCNHSRIGQPGGGNPLSTIPPS*', 'vpR', '6'),
('6558-6853;9065-9164', '6558', 'METPLREQENSLESSNERSSCISEADATTPESANLGEEILSQLYRPLEACYNTCYCKKCCYHCQFCFLKKGLGICYEQSRKRRRTPKKAKANTSSASNNRSIPNRTRHCQPEKAKKETVEKAVATAPGLGR*', 'Tat', '6'),
('6784-6853;9065-9321', '6784', 'MSSHEREEELRKRLRLIHLLHQTTDPYPTGPGTANQRRQRRRRWRRRWQQLLALADRIYSFPDPPTDTPLDLAIQQLQNLAIESIPDPPTNTPGALCDPTENSRSPQD*', 'Rev', '6'),
('25-2175', '25', 'MEDFVRQCFNPMIVELAEKAMKEYGEDLKIETNKFAAICTHLEVCFMYSDFHFINEQGESIIVEPEDPNALLKHRFEIIEGRDRTMAWTVVNSICNTTGAEKPKFLPDLYDYKENRFIEIGVTRREVHIYYLEKANKIKSEKTHIHIFSFTGEEMATKADYTLDEESRARIKTRLFTIRQEMASRGLWDSFRQSERGEETIEERFEITGTMRRLADQSLPPNFSCIENFRAYVDGFEPNGYIEGKLSQMSKEVNARIEPFLKTTPRPIRLPDGPPCFQRSKFLLMDSLKLSIEDPNHEGEGIPLYDAIKCMRTFFGWKEPSVVKPHEKGINPNYLLSWKQVLEELQDIESEEKIPRTKNMKKTSQLKWALGENMAPEKVDFDDCKDISDLKQYDSDEPELRSFSSWIQNEFNKACELTDSIWIELDEIGEDVAPIEHIASMRRNYFTAEVSHCRATEYIMKGVYINTALLNASCAAMDDFQLIPMISKCRTKEGRRKTNLYGFIIKGRSHLRNDTDVVNFVSMEFSLTDPRLEPHKWEKYCVLEIGDMLLRSAIGQVSRPMFLYVRTNGTSKIKMKWGMEMRRCLLQSLQQIESMIEAESSVKEKDMTKEFFENRSETWPIGESPKGVEEGSIGKVCRTLLAKSVFNSLYASPQLEGFSAESRKLLLIVQALRDNLEPGTFDIGGLYEAIEECLINDPWVLLNASWFNSFLTHALR*', 'PA', '7'),
('6860-9505', '6860', 'MGCLGNQLLIAILLLSVYGIYCTQYVTVFYGVPAWRNATIPLFCATKNRDTWGTTQCLPDNXDYSELAXNVTESFDAWENTVTEQAIEDVWQLFETSIKPCVKLSPLCITMRCNKSETDKWGLTKSSTTTTASTTRTTSAKIDMVNETSSCITHNNCTGLEQEQMISCKFNMTGLKRDKKKEYNETWYSTDLVCEQGNSTDNESRCYMNHCNTSVIQESCDKHYWDTIRFRYCAPPGYALLRCNDTNYSGFMPKCSKVVVSSCTRMMETQTSTWFGFNGTRAENRTYIYWHGRDNRTIISLNKYYNLTMKCRRPGNKTVLPVTIMSGLVFHSQPINDRPKQAWCWFGGNWKDAIKEVKQTIVKHPRYTGTNNTDKINLTAPRGGDPEVTFMWTNCRGEFLYCKMNWFLNWVEDRNLTLTTQKLRERHKRNYVPCHIRQIINTWHKVGKNVYLPPREGDLTCNSTVTSLIANIDWTDGNQTNITMSAEVAELYRLELGDYKLVEITPIGLAPTDVKRYTTGGTSRNKRGVFVLGFLGFLATAGSAMGAASLTLTAQSRTLLAGIVQQQQQLLDVVKRQQELLRLTVWGTKNLQTRVTAIEKYLKDQAQLNAWGCAFRQVCHTTVPWPNASLTPDWNNDTWQEWERKVDFLEENITALLEEAQIQQEKNMYELQKLNSWDVFGNWFDLASWIRYIQYGIYIVVGVILLRIVIYIVQMLAKLRQGYRPVFSSPPSYSQQIHTQQDPALPTREGKEGDGGEGGGNSSWPWQIEYIHFLIRQLIRLLTWLFSNCRTLLSRVYQILQPILQGLSATLRRIREVLRTELTYLQYGWSYFHEAVQAGWRSATETLAGAWGDLWETLRRGGRWILAIPRRIRQGLELTLL*', 'Env', '6'),
('9339-10130', '9339', 'MGGAISMRRSKPAGDLRQRLLRARGETYGRLLGEVEDGSSQSLGGLDKGLSSLSCEGQKYNQGQYMNTPWRNPAEEREKLAYRKQNMDDVDEEDDDLVGVPVMPRVPLRTMSYKLAIDMSHFIKEKGGLEGIYYSARRHRILDMYLEKEEGIIPDWQDYTSGPGIRYPKTFGWLWKLVPVNVSDEAQEDEEHYLMHPAQTAQWDDPWGEVLAWKFDPTLAYTYEAYVRYPEEFGSKSGLSEEEVRRRLTARGLLNMADKKETR*', 'Nef', '6'),
('5688-5759;7992-8225', '5688', 'MSSNEEELRRRLRLIHFLHQTSKYYPEGPGTANQRRRRRRRWRQRWQQILALADRIYSFPDPPANTPLDLAIQQLQRLAIEELPNPPASAPEPLKDIAESP*', 'Rev', '17'),
('8255-9046', '8255', 'MGGVTSKKQRKXGGNLRERLLQARGETYGRLWDGLEGDYSQSQDGSGRGLXSLSCEPQKYCXGQFMNTPWRNPRAEGAKLDYRQQNMDDVDDDDDDLVGFPVTPXVPXRTMTYKLAIDMSHFIKEKGGLEGIYYSDRRHKILNLYLEKEEGIIPDWQNYTAGPGIRYPMCFGWLWKLVPVDVSDEAQEDEXHCLMHPAQTSQWDDPWGEVLAWKFDPXLAYNYKAFVKHPEEFGSXSGLSEEEVKRRLTARGLLKMADKKETS*', 'Nef', '12'),
('19-2292', '19', 'MDVNPTLLFLKVPAQNAISTTFPYTGDPPYSHGTGTGYTMDTVNRTHQYSERGRWTKNTETGAPQLNPIDGPLPKDNEPSGYAQTDCVLEAMAFLEESHPGIFENSCIETMEVVQQTRVDKLTQGRQTYDWTLNRNQPAATALANTIEVFRSNGLIANESGRLIDFLKDVMKSMDRDEVEITTHFQRKRRVRDNVTKKMVTQRTIGKKKHKLDKRSYLIRALTLNTMTKDAERGKLKRRAIATPGMQIRGFVYFVETLARSICEKLEQSGLPVGGNEKKAKLANVVRKMMTNSQDTEISFTITGDNTKWNENQNPRMFLAMITYITKNQPEWFRNILSIAPIMFSNKMARLGKGYMFESKSMKLRTQIPAEMLANIDLKYFNDSTKKKIEKIRPLLIDGTASLSPGMMMGMFNMLSTVLGVSILNLGQKRYTKTTYWWDGLQSSDDFALIVNAPNHAGIQAGVDRFYRTCKLLGINMSKKKSYINRTGTFEFTSFFYRYGFVANFSMELPSFGVSGVNESADMSIGVTVIKNNMINNDLGPATAQMALQLFIKDYRYTYRCHRGDTQIQTRRSFEIKKLWDQTRSKAGLLVSDGGPNLYNIRNLHIPEVCLKWELMDEDYQGRLCNPLNPFVSHKEIESVNNAVMMPAHGPAKNMEYDAVATTHSWVPKRNRSILNTSQRGILEDEQMYQRCCNLFEKFFPSSSYRRPVGISSMVEAMVSRARIDARIDFESGRIKKEEFAEIMKTCSTIEDLRRQK*', 'PB1', '8'),
('28-2307', '28', 'MERIKELRNLMSQSRTREILTKTTVDHMAIIKKYTSGRQEKNPSLRMKWMMAMKYPITADKRITEMIPERNEQGQTLWSKVNDAGSDRVMISPLAVTWWNRNGPVASTIHYPKIYKTYFEKVERLKHGTFGPVHFRNQVKIRRRVDINPGHADLSAKEAQDVIMEVVFPNEVGARILTSESQLTITKEKKEELQNCKISPLMVAYMLERELVRKTRFLPVAGGTSSVYIEVLHLTQGTCWEQMYTPGGEVRNDDVDQSLIIAARNIVRRAAVSADPLASLLEMCHSTQIGGTRMVDILRQNPTEEQAVDICKAAMGLRISSSFSFGGFTFKRTSGSSVKREEEMLTGNLQTLKLTVHEGYEEFTMIGKRATAILRKATRRLIQLIVSGRDEQSIVEAIVVAMVFSQEDCMVKAVRGDLNFVNRANQRLNPMHQLLRHFQKDAKVLFLNWGIEPIDNVMGMIGILPDMTPSTEMSMRGVRVSKMGVDEYSNAEKVVVSIDRFLRVRDQRGNVLLSPEEVSETQGTEKLTITYSSSMMWEINGPESVLINTYQWIIRNWETIKIQWSQNPTMLYNKMEFEPFQSLVPKAIRGQYSGFVRTLFQQMRDVLGTFDTTQIIKLLPFAAAPPKQSRMQFSSLTVNVRGSGMRILVRGNSPVFNYNKTTKKLTVLGKDAGTLTEDPDEGTAGVESAVLRGFLILGKEDRRYGPALSINELSNLAKGEKANVLIGQGDVVLVMKRKRDSSILTDSQTATKRIRMAIN*', 'PB2', '9'),
('46-1542', '46', 'MASQGTKRSYEQMETDGERQNATEIRASVGRMIGGIGRFYIQMCTELKLNDYEGRLIQNSLTIERMVLSAFDERRNKYLEEHPSAGKDPKKTGGPVYKRVDGKWVRELVLYDKEEIRRIWRQANNGDDATAGLTHIMIWHSNLNDTTYQRTRALVRTGMDPRMCSLMQGSTLPRRSGAAGAAVKGVGTMVLELIRMIKRGINDRNFWRGENGRKTRIAYERMCNILKGKFQTAAQKAMMDQVRESRNPGNAEIEDLTFLARSALILRGSVAHKSCLPACVYGPAVASGYDFEKEGYSLVGVDPFKLLQTSQVYSLIRPNENPAHKSQLVWMACNSAAFEDLRVSSFIRGTKVLPRGKLSTRGVQIASNENMDAIVSSTLELRSRYWAIRTRSGGNTNQQRASAGQISTQPTFSVQRNLPFDKTTIMAAFTGNTEGRTSDMRAEIIKMMESARPEEVSFQGRGVFELSDERATNPIVPSFDMSNEGSYFFGDNAEEYDN*', 'NP', '10'),
('33-1730', '33', 'MKAKLLVLLCTFTATYADTICIGYHANNSTDTVDTVLEKNVTVTHSVNLLEDSHNGKLCLLKGIAPLQLGNCSVAGWILGNPECELLISKESWSYIVETPNPENGTCYPGYFADYEELREQLSSVSSFERFEIFPKGSSWPNHTVTGVSASCSHNGKSSFYRNLLWLTRKNGLYPNLSMSYVNNKEKEVLVLWGVHHPPNIGDQRALYHTENAYVSVVSSHYSRRFTPEIAKRPKVRDQEGRINYYWTLLEPGDTIIFEANGNLIAPWYAFALSRGFGSGIITSNAPMDECDAKCQTPQGAINSSLPFQNVHPVTIGECPKYVRSAKLRMVTGLRNIPSIQSRGLFGAIAGFIEGGWTGMVDGWYGYHHQNEQGSGYAADQKSTQNAINGITNKVNSVIEKMNTQFTAVGKEFNKLERRMENLNKKVDDGFLDIWTYNAELLVLLENERTLDFHDSNVKNLYEKVKSQLKNNAKEIGNGCFEFYHKCNNECMESVKNGTYDYPKYSEESKLNREKIDGVKLESMGVYQILAIYSTVASSLVLLVSLGAISFWMCSNGSLQCRICI*', 'HA', '11'),
('21-1433', '21', 'MNPNQKIITIGSISIAIGIISLMLQIGNIISIWASHSIQTGSQNHTGVCNQRIITYENSTWVNHTYVNINNTNVIAGKDKTSVTLAGNSSLCSISGWAIYTKDNSIRIGSKGDVFVIREPFISCSHLECRTFFLTQGALLNDKHSNGTVKDRSPYRALMSCPLGEAPSPYNSKFESVAWSASACHDGMGWLTIGISGPDNGAVAVLKYNGIITETIKSWKKQILRTQESECVCVNGSCFTIMTDGPSNGAASYKIFKIEKGKVTKSIELNAPNFHYEECSCYPDTGTVMCVCRDNWHGSNRPWVSFNQNLDYQIGYICSGVFGDNPRPKDGEGSCNPVTVDGANGVKGFSYKYGNGVWIGRTKSNRLRKGFEMIWDPNGWTDTDSDFSVKQDVVAITDWSGYSGSFVQHPELTGLDCIRPCFWVELVRGLPKENTTIWTSGSSISFCGVNSDTANWSWPDGAELPFTIDK*', 'NA', '18'),
('27-56;529-864', '27', 'MDSHTVSSFQDILMRMSKMQLGSSSGDLNGMITQFESLKLYRDSLGEAVMRLGDLHSLQHRNGKWREQLGQKFEEIRWLIEEVRHKLKTTENSFEQITFMQALQLLFEVEQEIRTFSFQLI*', 'NS2', '20'),
('27-719', '27', 'MDSHTVSSFQVDCFLWHVRKQVADQGLGDAPFLDRLRRDQKSLKGRGSTLGLNIETATCVGKQIVERILKEESDEAFKMTMASALASRYLTDMTIEEMSRDWFMLMPKQKVAGPLCVRMDQAIMDKNIILKANFSVIFDRLENLTLLRAFTEEGAIVGEISPLPSLPGHTNEDVKNAIGVLIGGLEWNDNTVRVSETLQRFAWRSSNETGGPPFTPTQKRKMAGTIRSEV*', 'NS1', '20'),
('26-646', '26', 'MSLLTEVETYVLSIIPSGPLKAEIAQRLEDVFAGKNTDLEALMEWLKTRPILSPLTKGILGFVFTLTVPSERGLQRRRFVQNALNGNGDPNNMDRAVKLYRKLKREITFHGAKEIALSYSAGALASCMGLIYNRMGAVTTESAFGLICATCEQIADSQHKSHRQMVTTTNPLIRHENRMVLASTTAKAMEQMAGSSEQAAEAMGGC*', 'M1', '19'),
('26-52;742-1008', '26', 'MSLLTEVETPIKNEWGCRCNDSSDPLVVAASIIGIVHLILWIIDRLFSKSIYRIFKHGLKRGPSTEGVPESMREEYREEQQNAVDADDGHFVSIELE*', 'M2', '19'),
('221-1744', '221', 'MGARNSVLSGKXADELEKIRLRPGGXKKYMLKHVVWAANELDRFGLAESLLENKEGCQKILSVLAPLVPTGSENLKSLYNTVCVIWCIHAEEKVKHTEEAKQIVQRHLVXETGTADKMPVTSRPTAPPSGRGGNYPVQQVGGNYTHLPLSPRTLNAWVKLIEEKKFGAEVVPGFQALSEGCTPYDINQMLNCXGEHQSAMQIIREIINEEAADWDLQHXQPGPIPAGQLRDPRGSDIAGTTSTVEEQIQWMYRQQNPIPVGNIYRRWIQLGLQKCVRMYNPTNILDVKQGPKEPFQSYVDRFYKSLRAEQTDPAVKNWMTQTLLIQNANPDCKLVLXGLGMNPTLEEMLTACQGVGGPGQKARLMAEALKEALTPGQLPFAAVQQRGQRKTIKXWNCGKEGHSARQCRAPRRQGCWKCGKTGHVMAKCPERQAGFLGLGPWGKKPRNFPMAQIPQGLTPTAPPEDPAVDLLRNYMKMGRRQRENRERPYKEVTEDLLHLNSLFGEDQ*', 'Gag', '12'),
('1501-4569', '1501', 'MPRETGGFFRAWPMGKEAPQFPHGPDTSGVDTNCSPRGSSCGSTEELHEDGQKAEGEQRETLQGGDGGFAAPQFSLWRRPVVTAYIEEQPXEVLXDTGADDSXVAGIELGPNYTPKIVGXIGGFXNTKEYKDVKIKVLGKVIKGTIMTGDTPINIFGRNLLTAMGMSLNLPIAKVEPIKVTLKPGKDGPKLRQWXLSKEKIIALREICEKMEKDGQLEEAPPTNPYNTPTFAIKKKDKNKWRMLIDFRELNKVTQDFTEVQLGIPHPAGLAKRRRITVLDVGDAYFSIPLDEEFRQYTAFTLPSVNNAEPGKRYIYKVLPQGWKGSPAIFQHTMRNVLEPFRKANPDVTLIQXMDDILIASDRTDLEHDRVVLQLKELLNSMGFSTPEEKFQKDPPFQWMGYELWPTKWKLQKIELPXKETWTXNDIQKLVGVLNWAAQIYPGIKTKHLCRLIRGKMTLTEEVQWTEMAEAEYEXNKIILSQEQEGCXYQEGXPLEATVIKSQDNQWSYKIHQEDXILKVGKFAKIKNTHTNGVRLLAHVVQKIGKEAIVIWGQVPKFHXPVEREIWEQWWTDYWQVTWIPEWDFVSTPPLVRLVFNLVKEPIQGAETFYVDGSCNRQSKEGKAGYVTDRGRDRTKPLXQTTNQQAEXEAFHLALADSGPKANIIVDSQYVMGIIAGQPTESESRLVNQIIEEMIKKEAIYVAWVPAHKGIGGNQEXDHLVSQGIRQVLFLEKIEPAQEEHEKYHSNVKELVFKFGLPRLVAKQIVDTCDKCHQKGEAIHGQVNAELGTWQMDCTHLEGKIIIVAVHVASGFIEAEVIPQETGRQTALFLLKLASRWPITHLHTDNGANFTSQEVKMVAWWAGIEQTFGVPYNPQSQGXVEAMNHHLKTQIDRXREQANSIXTIVLMAVHCMNFKRRGGIGDMTPAERLVNMITTEQEIQFQQSKNSKFKNFRVYYREGRDQLWKGPGELLWKGEGAVILKVGTEIKVVPRRKAKIIKDYGGGKELDSGSHLEDTGEAREVA*', 'Pol', '12'),
('4499-5143', '4499', 'MEEEKSWIAVPTWRIPGRLEKWHSLIKHLKYNTKDLQKACYVPHHKVGWAWWTCSRXIFPLRDESHLEVQGYWNLTPEKGWLSTYAVRITWYSRNFWTDVTPDYADTLLHGTYFPCFSEGEVRRAIRGEKLLSCCKFPKAHKNQVPSLQYLALTVVSHVRSQGEDPTWKQWRGNSRRGLRLARKNSRRNKQGSSESFAEGVNFPGLAKVLGILA*', 'Vif', '12'),
('4971-5309', '4971', 'MSDPRERIPPGNSGEETVGEAFDWLERTVEEINRAAVNHLPRELIFQVWRRSWEYWHDEIGMSASYTKXRYLCLIQKALFMHCKKGCRCLGGEHGAGGWRPGPPPPPPPGLA*', 'vpX', '12'),
('5311-5616', '5311', 'MTERPPEDEAPQREPWDEWVVEVLEEVKEEALKHFDPRLLTALGNYIYDRHGDTLEGAGELIKILQRALFIHFRGGCNHSRIGHSGGGNPLSTIPPSRGVL*', 'vpR', '12'),
('5462-5752;7985-8080', '5462', 'METPLKEQESSLKSSREHSSSISEVDATTPESATLEEEILSQLYRPLEACYNKCYCKKCCYHCQHCFLKKGLGICYEQQRRRTPKKTKANTFSASNKSLSRRARNRQPKKEKKETVETEVATDLGLGR*', 'Tat', '12'),
('5688-5752;7985-8222', '5688', 'MSSNEEELRRRLRLIHFLHQTSPYPEGPGTANQRRRRRRRWRQRWQQILALADRIXSFPDPPANTPLELAXQQLQRLAIEEXPDPPASAPEPLKDTAXSP*', 'Rev', '12'),
('5758-8421', '5758', 'MGCLGNQLLIALLLLSALGIXCVQYVTVFYGVPAWKNATIPLFCATKNRDTWXTTQCLPDNDDYSELAINVTEAFDAWDNTVTEQAIEDVWNLFQTSIKPCVKLTPLCIAMRCNKTETDRWGLTGKPTTTASTTTKTTSKPSVITAXVINEGDPCIKNNSCAGLEXXPMIGCKFNMTGLRKDKQREYNETWYSRDIVCEQNSNEHETASKCYMNHCNTSVIRESCDKHYWDAIRFRYCAPPGYALLRCNDSNYSGFEPNCTKVVVSSCTRMMETQTSTWFGFNGTRAENRTYIYWHGRSNRTIISLNKYYNLTIRCRRPGNKTVLPVTIMSGLVFHSQPINEXPKQAWCWFGGNWKXAIREVKETLVKHPRYTGTNNTEKINXTAPAGGDPEVTFMWTNCRGEFLYCKMNWFXNWVDETXGFRWXXQNPKEKKRRNYVPCHIRQVXXTWHRVGKNVYLPPREGDLTCNSTVTSLIAEIDWIDKNETNITMSAEVAELYRLELGDYKLVXITPIGLAPTSVRRYTTTGASRNKRGVFVLGFLGFLATAGSAMGAASLTLSAQSRTLLAGIVQQQQQLLDVVKRQQELLRLTVWGTXNLQTRVTAIEKYLKDQXQLNSWGCAFRQVCHTTVPWPNDTLXPNWXNMTWQEWERQVDFLEAXITQLXEEAQIQQEKXMYELQKLNSWDIFGNWFDLTSWIXYIQYGVLIVLGVIGLRIVIYVXQMLARLRQGYRPVFSSPPVYVQQIPIQKGQEPPTKEGEEGDGGDRGGNRSWPWQIEXIHFLIRQLIRLLSWXFNSCRDWLLRSXQILQPVLQSLSRILQXVREVIRVEITYLQYGWRYFQEAAQXWWKFARETLASAWGDLWETLGRVGRRLLAIPRRIRQGLXLTLL*', 'Env', '12'),
('1309-2841', '1309', 'MGVRNSVLSGKKADELEKIRLRPNGKKKYMLKHVVWAANELDRFGLAESLLENKEGCQKILSVLAPLVPTGSENLKSLYNTVCVIWCIHAEEKVKHTEEAKQIVQRHLVVETGTTETMPKTSRPTAPSSGRGGNYPVQQIGGNYVHLPLSPRTLNAWVKLIEEKKFGAEVVPGFQALSEGCTPYDINQMLNCVGDHQAAMQIIRDIINEEAADWDLQHPQPAPQQGQLREPSGSDIAGTTSSVDEQIQWMYRQQNPIPVGNIYRRWIQLGLQKCVRMYNPTNILDVKQGPKEPFQSYVDRFYKSLRAEQTDAAVKNWMTQTLLIQNANPDCKLVLKGLGVNPTLEEMLTACQGVGGPGQKARLMAEALKEALAPVPIPFAAAQQRGPRKPIKCWNCGKEGHSARQCRAPRRQGCWKCGKMDHVMAKCPDRQAGFLGLGPWGKKPRNFPMAQVHQGLMPTAPPEDPAVDLLKNYMQLGKQQREKQRESREKPYKEVTEDLLHLNSLFGGDQ*', 'Gag', '13'),
('2484-5666', '2484', 'VLELWERGTLCKAMQSPKKTGMLEMWKNGPCYGQMPRQTGGFFRPWSMGKEAPQFPHGSSASGADANCSPRGPSCGSAKELHAVGQAAERKAERKQREALQGGDRGFAAPQFSLWRRPVVTAHIEGQPVEVLLDTGADDSIVTGIELGPHYTPKIVGGIGGFINTKEYKNVEIEVLGKRIKGTIMTGDTPINIFGRNLLTALGMSLNFPIAKVEPVKVALKPGKDGPKLKQWPLSKEKIVALREICEKMEKDGQLEEAPPTNPYNTPTFAIKKKDKNKWRMLIDFRELNRVTQDFTEVQLGIPHPAGLAKRKRITVLDIGDAYFSIPLDEEFRQYTAFTLPSVNNAEPGKRYIYKVLPQGWKGSPAIFQYTMRHVLEPFRKANPDVTLVQYMDDILIASDRTDLEHDRVVLQSKELLNSIGFSTPEEKFQKDPPFQWMGYELWPTKWKLQKIELPQRETWTVNDIQKLVGVLNWAAQIYPGIKTKHLCRLIRGKMTLTEEVQWTEMAEAEYEENKIILSQEQEGCYYQEGKPLEATVIKSQDNQWSYKIHQEDKILKVGKFAKIKNTHTNGVRLLAHVIQKIGKEAIVIWGQVPKFHLPVEKDVWEQWWTDYWQVTWIPEWDFISTPPLVRLVFNLVKDPIEGEETYYTDGSCNKQSKEGKAGYITDRGKDKVKVLEQTTNQQAELEAFLMALTDSGPKANIIVDSQYVMGIITGCPTESESRLVNQIIEEMIKKSEIYVAWVPAHKGIGGNQEIDHLVSQGIRQVLFLEKIEPAQEEHDKYHSNVKELVFKFGLPRIVARQIVDTCDKCHQKGEAIHGQANSDLGTWQMDCTHLEGKIIIVAVHVASGFIEAEVIPQETGRQTALFLLKLAGRWPITHLHTDNGANFASQEVKMVAWWAGIEHTFGVPYNPQSQGVVEAMNHHLKNQIDRIREQANSVETIVLMAVHCMNFKRRGGIGDMTPAERLINMITTEQEIQFQQSKNSKFKNFRVYYREGRDQLWKGPGELLWKGEGAVILKVGTDIKVVPRRKAKIIKDYGGGKEVDSSSHMEDTGEAREVA*', 'Pol', '13'),
('5596-6240', '5596', 'MEEEKRWIAVPTWRIPERLERWHSLIKYLKYKTKDLQKVCYVPHFKVGWAWWTCSRVIFPLQEGSHLEVQGYWHLTPEKGWLSTYAVRITWYSKNFWTDVTPNYADILLHSTYFPCFTAGEVRRAIRGEQLLSCCRFPRAHKYQVPSLQYLALKVVSDVRSQGENPTWKQWRRDNRRGLRMAKQNSRGDKQRGGKPPTKGANFPGLAKVLGILA*', 'Vif', '13'),
('6068-6406', '6068', 'MSDPRERIPPGNSGEETIGEAFEWLNRTVEEINREAVNHLPRELIFQVWQRSWEYWHDEQGMSPSYVKYRYLCLIQKALFMHCKKGCRCLGEGHGAGGWRPGPPPPPPPGLA*', 'vpX', '13'),
('6407-6712', '6407', 'MEERPPENEGPQREPWDEWVVEVLEELKEEALKHFDPRLLTALGNHIYNRHGDTLEGAGELIRILQRALFMHFRGGCIHSRIGQPGGGNPLSAIPPSRSML*', 'vpR', '13'),
('6558-6853;9062-9158', '6558', 'METPLREQENSLESSNERSSCISEADASTPESANLGEEILSQLYRPLEACYNTCYCKKCCYHCQFCFLKKGLGICYEQSRKRRRTPKKAKANTSSASNKPISNRTRHCQPEKAKKETVEKAVATAPGLGR*', 'Tat', '13'),
('6784-6853;9062-9315', '6784', 'MSNHEREEELRKRLRLIHLLHQTNPYPTGPGTANQRRQRKRRWRRRWQQLLALADRIYSFPDPPTDTPLDLAIQQLQNLAIESIPDPPTNTPEALCDPTEDSRSPQD*', 'Rev', '13'),
('6860-9499', '6860', 'MGCLGNQLLIAILLLSVYGIYCTLYVTVFYGVPAWRNATIPLFCATKNRDTWGTTQCLPDNGDYSEVALNVTESFDAWNNTVTEQAIEDVWQLFETSIKPCVKLSPLCITMRCNKSETDRWGLTKSITTTASTTSTTASAKVDMVNETSSCIAQDNCTGLEQEQMISCKFNMTGLKRDKKKEYNETWYSADLVCEQGNNTGNESRCYMNHCNTSVIQESCDKHYWDAIRFRYCAPPGYALLRCNDTNYSGFMPKCSKVVVSSCTRMMETQTSTWFGFNGTRAENRTYIYWHGRDNRTIISLNKYYNLTMKCRRPGNKTVLPVTIMSGLVFHSQPINDRPKQAWCWFGGKWKDAIKEVKQTIVKHPRYTGTNNTDKINLTAPGGGDPEVTFMWTNCRGEFLYCKMNWFLNWVEDRNTANQKPKEQHKRNYVPCHIRQIINTWHKVGKNVYLPPREGDLTCNSTVTSLIANIDWIDGNQTNITMSAEVAELYRLELGDYKLVEITPIGLAPTDVKRYTTGGTSRNKRGVFVLGFLGFLATAGSAMGAASLTLTAQSRTLLAGIVQQQQQLLDVVKRQQELLRLTVWGTKNLQTRVTAIEKYLKDQAQLNAWGCAFRQVCHTTVPWPNASLTPKWNNETWQEWERKVDFLEENITALLEEAQIQQEKNMYELQKLNSWDVFGNWFDLASWIKYIQYGVYIVVGVILLRIVIYIVQMLAKLRQGYRPVFSSPPSYFQQTHIQQDPALPTREGKERDGGEGGGNSSWPWQIEYIHFLIRQLIRLLTWLFSNCRTLLSRVYQILQPILQRLSATLQRIREVLRTELTYLQYGWSYFHEAVQAVWRSATETLAGAWGDLWETLRRGGRWILAIPRRIRQGLELTLL*', 'Env', '13'),
('9333-9569', '9333', 'MGGAISMRRSRPSGDLRQRLLRARGETYGRLLGEVEDGYSQSPGGLDKGLSSLSCEGQVSFYKRKGGTGRDLLQCKKT*', 'Nef', '13'),
('221-1744', '221', 'MGARNSVLSGKXADELEKIRLRPGGXKKYMLKHVXWAANELDRFGLAESLLENKEGCQKILSVLAPLVPTGSENLKSLYNTVCVIWCIHAEEKVKHTEEAKQIVQRHLVXETGTADKMPXTSRPTAPPSGRGGNYPVQQVGGNYTHLXLSPRTLNAWVKLIEEKKFGAEVVPGFQALSEGCTPYDINQMXNCXGEHQSAMQIIREIINEEAADWDLQHXQPXPIPAGQLRDPRGSDIAGTTSTVEEQIQWMYRQQNPIPVGNIYRRWIQLGLQKCVRMYNPTNILDVKQGPKEPFQSYVDXFYKSXRAEQTDPAVKNWMTQTLLIQNANPDCKLVLXGLGMNPTLEEMLTACQGVGGPGQKARLMAEALXEALTPGQLPFAAVQQRGQRKTIKXWNCGKEGHSARXCRAPRRQXCWKCGKTGHVMAKCPXRQAGFLGLGPWGKKPRNFPMAQIPQGLTPTAPPEDPAVDLLRNXMKMGRRQRENRERPYKEVTEDLLHLNSLFGEDQ*', 'Gag', '14'),
('1501-4569', '1501', 'MPRXTGGFFRAWPMGKEAPQFPHGPDTSGVDTNCSPRGSSCGSTEELXEDGQKAEGEQRETLQGGDGGFAAPQFSLWRRPVVTAXIEEQPXEVLLDTGADDSXVAGIELGPNYTPKIVGXIGGFINTKEYKDVKIKVLGXXIKGTIMTGDTPINIFGRNLLTAMGMSLNLPIAKXEPIKVTLKPGKDGPKLRQWXLSKEKIIALREICEKMEKDGQLEEAPPTNPYNTPTFAIKKKDKNKWRMLIDFRELNKVTQDFTEVQLGIPHPAGLAKRRRITVLDVGDAYFSIPLDEEFRQYTAFTLPSVNNAEPGKRYIYKVLPQGWKGSPAIFQHTMRNVLEPFRKANPDVTLIQXMDDILIASDRTXLEHDRVVLQLKELLNSMGFSTPEEKFQKDPPFQWMGYELWPTKWKLQKIELPXXETWTXNDIQKLVGVLNWAAQIYPGIKTKHLCRLIRGKMTLTEEVQWTEMAEAEYEXNKIILSQEQEGCXYQEGXPLEATVIKSQDNQWSYKIHQEDXILKVGKFAKIKNTHTNGVRLLAHVVQKIGKEAIVIWGQVPKFHXPVEREXWEQWWTDYWQVTWIPEWDFVSTPPLVRLVFNLVKEPIQGAETFYVDGSCNRQSKEGKAGYVTDRGRDRTKPLEQTTNQQAEXEAFHLALADSGPKANIIVDSQYVMGIIAGQPTESESRLVNQIIEEMIKKEAIYVAWVPAHKGIGGNQEXDHLXSQGIRQVLFLEKIEPAQEEHEKYHSNVKELVFKFGLPRLVAKQIVDTCDKCHQKGXAIHGQVNAELGTWQMDCTHLEGKIIIVAVHVASGFIEAEVIPQETGRQTALFLLKLASRWPITHLXTDNGANFTSQEVKMVAWWAGIEQTFGVPYNPQSQGXVEAMNHHLKTQIDRXREQANSIXTIVLMAVHCMNFKRRGGIGDMTPAERLVNMITTEQEIQFQQSKNSKFKNFRVYYREGRDQLWKGPGELLWKGEGAVILKVGTEIKVVPRRKAKIIKDYGGGKXLDSGSHLEDTGEAREVA*', 'Pol', '14'),
('4499-5143', '4499', 'MEEEKXWIAVPTWRIPGRLEKWHSLIKHLKYNTKDLQKACYVPHHKVGWAWWTCSRXIFPLRDXSHLEVQGYWNLTPEKGWLSTYAVRITWYSXNFWTDVTPDYADTLLHGTYFPCFSEGEVRRAIRGEKLLSCCKFPKAHKNQVPSLQYLALTVVSHVRSQGEXPTWKQWRGNXRRGLRLAXKNSRRNKQGSSESFAEGVNFPGLAKVLGILA*', 'Vif', '14'),
('4971-5309', '4971', 'MSDPRERXPPGNSGEEXVGEAFDWXERTVEEINRAAVNHLPRELIFQVWRRSWEYWHDEIGMSASYTKXRYLCLIQKALFMHCKKGCRCLGGEHGAGGWRPGPPPPPPPGLA*', 'vpX', '14'),
('5311-5616', '5311', 'MTERPPEDEAPQREPWDEWVVEVLEEVKEEALKHFDPRLLTALGNYIYDRHGDTLEGAGELIXILQRALFIHFRGGCNHSRIGHSGGGNPLSTIPPSRGVL*', 'vpR', '14'),
('5462-5751;7984-8080', '5462', 'METPLKEQESSLXSSREHSSSISEVDATTPESATLEEEILSQLYRPLEACYNKCYCKKCCYHCQHCFLKKGLGICYEQQRRRTPKKTKANTFSASNKSLSRRARNRQPKKEKKETVETEVATDLGLGR*', 'Tat', '14'),
('5688-5759;7992-8222', '5688', 'MSSNEEELRRRLRLIHFLHQTSKYPEGPGTANQRRRRRRRWRQRWQQILALADRIXSFPDPPANTPLELAXQQLQXLAIEEXPDPPASAPEPLKDTAXSP*', 'Rev', '14'),
('5758-8421', '5758', 'MGCLGNQLLIALLLLSALGISCVQYXTVFYGXPAWKNATXPLFCAXXNRXTWXTTQCLPDNDDYSELAINVTEAFDAWDNTVTEQAIEDVWNLFQTSIKPCVKLTPLCIAMRCNKTETDRWGLTGKPTTTASTTTKTTSKPSVITAXVINEGDPCIKNNSCAGLEXXPMIGCKFNMTGLRKDKQREYNETWYSRDIVCEQNSNEXETASKCYMNHCNTSVIRESCDKHYWDAIRFRYCAPPGYALLRCNDSNYSGFEPNCTKVVVSSCTRMMETQTSTWFGFNGTRAENRTYIYWHGRSNRTIISLNKYYNLTXRCRRPGNKTVLPVTIMSGLVFHSQPINEXPKQAWCWFGGNWKXXIREVKETLVKHPRYTGTNNTEKINXTAPAGGDPEVTFMWTNCRGEFLYCKMNWFXNWVDETXGFRWNXQNPKEKKRRNYVPCHIRQVXXTWHXVGKNVYLPPREGDLTCNSTVTSLIAEIDWIDKNETNITMSAEVAELYRLELGDYKLVXITPIGLAPTSVRRYTTTGASRNKRGVFVLGFLGFLATAGSAMGAASLTLSAQSRTLLAGIVQQQQQLLDVVKRQQELLRLTVWGTXNLQTRVTAIEKYLKDQXHLNSWGCAFRQVCHTTVPWPNDTLXPNWXNMTWQEWERQVDFLEAXITQLXEEAQIQQEKXMYELQKLNSWDIFGNWFDLTSWIXYIQYGVLIVLGVIGLRIVIYVXXMLARLRQGYRPVFSSPPVYVQQIPIQKGQEPPTKEGEEGDGGDRGGNRSWPWQIEXIHFLIRQLIRLLSWXFNSCRXWLLRSXQILQPVLQSLSRILQXVREVIRVEITYLQYGWRYFQEAAQXWWKFARETLASAWGDLWETLGRVGRRLLAIPRXIRQGLXLTLL*', 'Env', '14'),
('8255-9046', '8255', 'MGGVTSKKQRKHGGNLRERLLQARGETYGRLWDGLEGDYSQSQDGSGRGLSSLSCEPQKYCEGQFMNTPWRNPRAEGAKLDYRQQNMDDVDDDDDDLVGFPVTPKVPLRTMTYKLAIDMSHFIKEKGGLEGIYYSDRRHKILNLYLEKEEGIIPDWQNYTAGPGIRYPMCFGWLWKLVPVDVSDEAQEDEAHCLMHPAQTSQWDDPWGEVLAWKFDPELAYNYKAFVKHPEEFGSSSGLSEEEVKRRLTARGLLKMADKKETS*', 'Nef', '14'),
('9099-9890', '9099', 'MGGAISKKQHRRGGNLRERLLRARGETYGRLWEGLEEGYSQSLGASGKGLSSLSCEPQKYSEGQYMNTPWRNPTAEKAKLGYKQQNMDDVDDEDDDLVGVSVHPKVPLRAMTYKLAIDMSHFIKEKGGLEGIYYNEKRHRILDMYMEKEEGIIPDWQNYTLGPGTRYPMYFGWLWKLVPVDVSDEAQEDETHCLVHPAQTHQWDDPWGEVLAWKFDPELAYSYKAFIKYPEEFGSKSGLSEEEVKRRLTARGIYKMADKRETS*', 'Nef', '16'),
('1631-4642', '1631', 'FFREDLAFLQGKAREFSSEQTRANSPTRRELQVWGRDNNSPSEAGADRQGTVSFNFPQVTLWQRPLVTIKIGGQLKEALLDTGADDTVLEEMSLPGRWKPKMIGGIGGFIKVRQYDQILIEICGHKAIGTVLVGPTPVNIIGRNLLTQIGCTLNFPISPIETVPVKLKPGMDGPKVKQWPLTEEKIKALVEICTEMEKEGKISKIGPENPYNTPVFAIKKKDSTKWRKLVDFRELNKRTQDFWEVQLGIPHPAGLKKKKSVTVLDVGDAYFSVPLDEDFRKYTAFTIPSINNETPGIRYQYNVLPQGWKGSPAIFQSSMTKILEPFRKQNPDIVIYQYMDDLYVGSDLEIGQHRTKIEELRQHLLRWGLTTPDKKHQKEPPFLWMGYELHPDKWTVQPIVLPEKDSWTVNDIQKLVGKLNWASQIYPGIKVRQLCKLLRGTKALTEVIPLTEEAELELAENREILKEPVHGVYYDPSKDLIAEIQKQGQGQWTYQIYQEPFKNLKTGKYARMRGAHTNDVKQLTEAVQKITTESIVIWGKTPKFKLPIQKETWETWWTEYWQATWIPEWEFVNTPPLVKLWYQLEKEPIVGAETFYVDGAANRETKLGKAGYVTNRGRQKVVTLTDTTNQKTELQAIYLALQDSGLEVNIVTDSQYALGIIQAQPDQSESELVNQIIEQLIKKEKVYLAWVPAHKGIGGNEQVDKLVSAGIRKVLFLDGIDKAQDEHEKYHSNWRAMASDFNLPPVVAKEIVASCDKCQLKGEAMHGQVDCSPGIWQLDCTHLEGKVILVAVHVASGYIEAEVIPAETGQETAYFLLKLAGRWPVKTIHTDNGSNFTGATVRAACWWAGIKQEFGIPYNPQSQGVVESMNKELKKIIGQVRDQAEHLKTAVQMAVFIHNFKRKGGIGGYSAGERIVDIIATDIQTKELQKQITKIQNFRVYYRDSRNPLWKGPAKLLWKGEGAVVIQDNSDIKVVPRRKAKIIRDYGKQMAGDDCVASRQDED*', 'Pol', '5'),
('309-1841', '309', 'MGARNSVLSGKKADELEKIRLRPNGKKKYMLKHVVWAANELDRFGLAESLLENKEGCRKILSVLAPLMPTGSENLKSLYNTVCVIWCIHAEEKVKHTEEAKQIVQRHLVVETGTTETMPKTSRPTAPSSGRGGNYPVQQIGGNYVHLPLSPRTLNAWVKLIEEKKFGAEVVPGFQALSEGCTPYDINQMLNCVGDHQAAMQIIRDIINEEAADWDLQHPQPAPQQGQLREPSGSDIAGTTSSVDEQIQWMYRQQNPIPVGNIYRRWIQLGLQKCVRMYNPTNILDVKQGPKEPFQSYVDRFYKSLRAEQTDAAVKNWMTQTLLIQNANPDCKLVLKGLGVNPTLEEMLTACQGVGGPGQKARLMAEALKEALAPVPIPFAAAQQRGSRKPIKCWNCGKEGHSARQCRAPRRQGCWKCGKMDHVMAKCPDRQAGFLGLGPWGKKPRNFPMAQVHQGLMPTAPPEDPAVDLLKSYMQLGKQQREKQRESREKPYKEVTEDLLHLNSLFGGDQ*', 'Gag', '15'),
('5860-8499', '5860', 'MGCLGNQLLIAILLLSVYGIYGTLYVTVFYGVPAWRNATIPLFCATKNRDTWGTTQCLPDNGDYSEMALNVTESFDAWNNTVTEQAIEDVWQLFETSIKPCVKLSPLCITMRCNKSETDRWGLTKSITTTASTTSTTASAKVDMVNETSSCIAQDNCTGLEQEQMISCKFNMTGLKRDKKKEYNETWYSADLVCEQGNNTGNESRCYMNHCNTSVIQESCDKHYWDAIRFRYCAPPGYALLRCNDTNYSGFMPNCSKVVVSSCTRMMETQTSTWFGFNGTRAENRTYIYWHGRDNRTIISLNKYYNLTMKCRRPGNKTVLPVTIMSGLVFHSQPINDRPKQAWCWFGGKWKDAIKEVKQTIVKHPRYTGTNNTDKINLTAPGGGDPEVTFMWTNCRGEFLYCKMNWFLNWVEDRNTANQTSKEQHKRNYVPCHIRQIINTWHKVGRNVYLPPREGDLTCNSTVTSLIANIDWIDGNQTNITMSAEVAELYRLELGDYKLVEITPIGLAPTNVKRYTTGGTSRNKRGVFVLGFLGFLATAGSAMGAASLTLTAQSRTLLAGIVQQQQQLLDVVKRQQELLRLTVWGTKNLQTRVTAIEKYLKDQAQLNAWGCAFRQVCHTTVPWPNASLTPEWNNETWQEWERKVDFLEENITALLEEAQIQQERNMYELQKLNSWDVFGNWFDLASWIKYIQYGVYIVVGVILLRIVIYIVQMLAKLRQGYRPVFSSPPSYFQQTHIQQDPALPTREGKEGDGGEGGGNSSWPWQIEYIHFLVRQLIRLLTWLFSNCRTLLSRVYQVLQPILQRLSATLQRIREVLRTELTYLQYGWSYFHEAVQAVWRSATETLAGAWGDLWETLRRGGRWILAIPRRIRQGLELTLL*', 'Env', '15'),
('8333-9124', '8333', 'MGGAISMRRSRPSGDLRQRLLRARGETYGRLLGEVEDGYSQSPGGLDKGLSSLSCEGQKYNQGQYMNTPWRNPAEEREKLAYRKQNMDDIDEEDDDLVGVSVRSKVPLRTMSYKLAIDMSHFIKEKGGLEGIYYSARRHRILDIYLEKEEGIIPDWQDYTSGPGIRYPKTFGWLWKLVPVNVSDEAQEDEEHYLMHPAQTSQWDDPWGEVLAWKFDPTLAYTYEAYVRYPEEFGSKSGLSEEEVRRRLTARGLLNMADKKETR*', 'Nef', '15'),
('1484-4666', '1484', 'VLELWERGTLCKAMQSPKKTGMLEMWKNGPCYGQMPRQTGGFFRPWSMGKEAPQFPHGSSASGADANCSPRGPSCGSAKELHAVGQAAERKAERKQREALQGGDRGFAAPQFSLWRRPVVTAHIEEQPVEVLLDTGADDSIVTGIELGPHYTPKIVGGIGGFINTKEYKNVEIEVLGKRIKGTIMTGDTPINIFGRNLLTALGMSLNFPIAKVEPVKVALKPGKDGPKLKQWPLSKEKIVALREICEKMEKDGQLEEAPPTNPYNTPTFAIKKKDKNKWRMLIDFRELNRVTQDFTEVQLGIPHPAGLAKRKRITVLDIGDAYFSIPLDEEFRQYTAFTLPSVNNAEPGKRYIYKVLPQGWKGSPAIFQYTMRHVLEPFRKANPDVTLVQYMDDILIASDRTDLEHDRVVLQLKELLNSIGFSTPEEKFQKDPPFQWMGYELWPTKWKLQKIELPQRETWTVNDIQKLVGVLNWAAQIYPGIKTKHLCRLIRGKMTLTEEVQWTEMAEAEYEENKIILSQEQEGCYYQEGKPLEATVIKSQDNQWSYKIHQEDKILKVGKFAKIKNTHTNGVRLLAHVIQKIGKEAIVIWGQIPKFHLPVEKDVWEQWWTDYWQVTWIPEWDFISTPPLVRLVFNLVKDPIEGEETYYTDGSCNKQSKEGKAGYITDRGKDKVKVLEQTTNQQAELEAFLMALTDSGPKANIIVDSQYVMGIITGCPTESESRLVNQIIEEMIKKSEIYVAWVPAHKGIGGNQEIDHLVSQGIRQVLFLEKIEPAQEEHDKYHSNVKELVFKFGLPRIVARQIVDTCDKCHQKGEAIHGQTNSDLGTWQMDCTHLEGKIIIVAVHVASGFIEAEVIPQETGRQTALFLLKLAGRWPITHLHTDNGANFASQEVKMVAWWAGIEHTFGIPYNPQSQGVVEAMNHHLKNQIDRIREQANSVETIVLMAVHCMNFKRRGGIGDMTPAERLINMITTEQEIQFQQSKNSKFKNFRVYYREGRDQLWKGPGELLWKGEGAVILKVGTDIKVVPRRKAKIIKDYGGGKEVDSSSHMEDTGEAREVA*', 'Pol', '15'),
('5784-5852;8064-8315', '5784', 'MSNHEREEELRKRLRLIHLLHQTPYPTGPGTANQRRQRRRRWRRRWQQLLALADRIYSFPGPSTDTPLDLAIQQLQNLAIESIPGPPTNTPEALCDPTEDSRSPQD*', 'Rev', '15'),
('5558-5854;8064-8159', '5558', 'METPLREQENSLESSNERSSCISEADASTPESANLGEEILSQLYRPLEACYNTCYCKKCCYHCQFCFLKKGLGICYEQSRKRRRTPKKAKANTSSASNKPISNRTRHCQPEKAKKETVEKAVATAPGLGR*', 'Tat', '15'),
('4596-5240', '4596', 'MEEEKRWIAVPTWRIPERLERWHSLIKYLKYKTKDLQKVCYVPHFKVGWAWWTCSRVIFPLQEGSHLEVQGYWNLTPEKGWLSTYAVRITWYSKNFWTDVTPNYADILLHSTYFPCFTAGEVRRAIRGEQLLSCCRFPRAHKYQVPSLQYLALKVVSDVRSQGENPTWKQWRRDNRRGLRMAKQNSRGDKQRGGKPPTKGADFPGLAKVLGILA*', 'Vif', '15'),
('5407-5712', '5407', 'MEERPPENEGPQREPWDEWVVEVLEELKEEALKHFDPRLLTALGNHIYNRHGDTLEGAGELIRILQRALFMHFRGGCIHSRIGQPGGGNPLSAIPPSRSML*', 'VpR', '15'),
('5068-5406', '5068', 'MSDPRERIPPGNSGEETIGEAFEWLNRTVEEINREAVNHLPRELIFQVWQRSWEYWHDEQGMSPSYVKYRYLCLIQKALFMHCKKGCRCLGEGHGAGGWRPGPPPPPPPGLA*', 'Vpx', '15'),
('1799-2095', '1799', 'PQVTLWQRPLVTIKIGGQLKEALLDTGADDTVLEEMSLPGRWKPKMIGGIGGFIKVRQYDQILIEICGHKAIGTVLVGPTPVNIIGRNLLTQIGCTLNF', 'Protease', '5'),
('2096-3775', '2096', 'PISPIETVPVKLKPGMDGPKVKQWPLTEEKIKALVEICTEMEKEGKISKIGPENPYNTPVFAIKKKDSTKWRKLVDFRELNKRTQDFWEVQLGIPHPAGLKKKKSVTVLDVGDAYFSVPLDEDFRKYTAFTIPSINNETPGIRYQYNVLPQGWKGSPAIFQSSMTKILEPFRKQNPDIVIYQYMDDLYVGSDLEIGQHRTKIEELRQHLLRWGLTTPDKKHQKEPPFLWMGYELHPDKWTVQPIVLPEKDSWTVNDIQKLVGKLNWASQIYPGIKVRQLCKLLRGTKALTEVIPLTEEAELELAENREILKEPVHGVYYDPSKDLIAEIQKQGQGQWTYQIYQEPFKNLKTGKYARMRGAHTNDVKQLTEAVQKITTESIVIWGKTPKFKLPIQKETWETWWTEYWQATWIPEWEFVNTPPLVKLWYQLEKEPIVGAETFYVDGAANRETKLGKAGYVTNRGRQKVVTLTDTTNQKTELQAIYLALQDSGLEVNIVTDSQYALGIIQAQPDQSESELVNQIIEQLIKKEKVYLAWVPAHKGIGGNEQVDKLVSAGIRKVL', 'Pol p66 RT', '5'),
('3416-3775', '3416', 'YVDGAANRETKLGKAGYVTNRGRQKVVTLTDTTNQKTELQAIYLALQDSGLEVNIVTDSQYALGIIQAQPDQSESELVNQIIEQLIKKEKVYLAWVPAHKGIGGNEQVDKLVSAGIRKVL', 'RNAse H', '5'),
('3776-4642', '3776', 'FLDGIDKAQDEHEKYHSNWRAMASDFNLPPVVAKEIVASCDKCQLKGEAMHGQVDCSPGIWQLDCTHLEGKVILVAVHVASGYIEAEVIPAETGQETAYFLLKLAGRWPVKTIHTDNGSNFTGATVRAACWWAGIKQEFGIPYNPQSQGVVESMNKELKKIIGQVRDQAEHLKTAVQMAVFIHNFKRKGGIGGYSAGERIVDIIATDIQTKELQKQITKIQNFRVYYRDSRNPLWKGPAKLLWKGEGAVVIQDNSDIKVVPRRKAKIIRDYGKQMAGDDCVASRQDED*', 'Integrase', '5'),
('1-1701', '1', 'MKAILVVLLYTFATANADTLCIGYHANNSTDTVDTVLEKNVTVTHSVNLLEDKHNGKLCKLRGVAPLHLGKCNIAGWILGNPECESLSTASSWSYIVETPSSDNGTCYPGDFIDYEELREQLSSVSSFERFEIFPKTSSWPNHDSNKGVTAACPHAGAKSFYKNLIWLVKKGNSYPKLSKSYINDKGKEVLVLWGIHHPSTSADQQSLYQNADTYVFVGSSRYSKKFKPEIAIRPKVRDQEGRMNYYWTLVEPGDKITFEATGNLVVPRYAFAMERNAGSGIIISDTPVHDCNTTCQTPKGAINTSLPFQNIHPITIGKCPKYVKSTKLRLATGLRNIPSIQSRGLFGAIAGFIEGGWTGMVDGWYGYHHQNEQGSGYAADLKSTQNAIDEITNKVNSVIEKMNTQFTAVGKEFNHLEKRIENLNKKVDDGFLDIWTYNAELLVLLENERTLDYHDSNVKNLYEKVRSQLKNNAKEIGNGCFEFYHKCDNTCMESVKNGTYDYPKYSEEAKLNREEIDGVKLESTRIYQILAIYSTVASSLVLVVSLGAISFWMCSNGSLQCRICI*', 'HA', '29'),
('221-1744', '221', 'MGARXSVLSGKKADELEKIRLRPGGKKKYMLKHVVWAANELDXFGLAESLLENKEGCQXILSXLAPLVPTGSENLKSXYNTVCVIWCIHAEEKVKHTEEAKQIVQRHLVVETGTADKMPATSRPTAPPSGRGGNYPVQQVGGNYTHLPLSPRTLNAWVKLXEEKKFGAEVVPGFXALSEGCXPYDINQMLNCXGEXQSAMQIIREIINEEAADWDLQHPQPGPIPAGXLRDPRGSDIAGTTSTVEEQIQWMYRQQNPIPVGNIYRRWIQLGLQKCVRMYNPTNILDVKXGXKEPFQSYVDRFYKSLRAEQTDPAVKNWMTQTLLIQNANPDCKLVLKGLGMNPTLEEMLTACQGXGGPGQKARLMAEALKEALTPGQLPFAAVQQRGQRKTIKXWNCGKEGHSARQCRAPRRQGCWKCGXTGHVMAKCPERQAGFLGLGPWGKKPRNFPMAQIPQGLTPTAPPEDPAVDLLKNYMRMGRRQRXNRERPYKXVTEDLLHLNSLFGEDQ*', 'Gag', '17'),
('1-2274', '1', 'MDVNPTLLFLKIPAQNAISTTFPYTGDPPYSHGTGTGYTMDTVNRTHQYSEKGKWTTNTETGAPQLNPIDGPLPEDNEPSGYAQTDCVLEAMAFLEESHPGIFENSCLETMEVVQQTRVDKLTQGRQTYDWTLNRNQPAATALANTIEVFRSNGLTANESGRLIDFLKDVMESMNKEEIEITTHFQRKRRVRDNMTKKMVTQRTIGKKKQRLNKRGYLIRALTLNTMTKDAERGKLKRRAIATPGMQIRGFVYFVETLARSICEKLEQSGLPVGGNEKKAKLANVVRKMMTNSQDTEISFTITGDNTKWNENQNPRMFLAMITYITRNQPEWFRNILSMAPIMFSNKMARLGKGYMFESKRMKIRTQIPAEMLASIDLKYFNESTKKKIEKIRPLLIDGTASLSPGMMMGMFNMLSTVLGVSILNLGQKKYTKTIYWWDGLQSSDDFALIVNAPNHEGIQAGVDRFYRTCKLVGINMSKKKSYINKTGTFEFTSFFYRYGFVANFSMELPSFGVSGVNESADMSIGVTVIKNNMINNDLGPATAQMALQLFIKDYRYTYRCHRGDTQIQTRRSFELKKLWDQTQSKVGLLVSDGGPNLYNIRNLHIPEVCLKWELMDDDYRGRLCNPLNPFVSHKEIDSVNNAVVMPAHGPAKSMEYDAVATTHSWIPKRNRSILNTSQRGILEDEQMYQKCCNLFEKFFPSSSYRRPVGISSMVEAMVSRARIDARVDFESGRIKKEEFSEIMKICSTIEELRRQK*', 'PB1', '35'),
('1-2280', '1', 'MERIKELRDLMSQSRTREILTKTTVDHMAIIKKYTSGRQEKNPALRMKWMMAMRYPITADKRIMDMIPERNEQGQTLWSKTNDAGSDRVMVSPLAVTWWNRNGPTTSTVHYPKVYKTYFEKVERLKHGTFGPVHFRNQVKIRRRVDTNPGHADLSAKEAQDVIMEVVFPNEVGARILTSESQLAITKEKKEELQDCKIAPLMVAYMLERELVRKTRFLPVAGGTGSVYIEVLHLTQGTCWEQMYTPGGEVRNDDVDQSLIIAARNIVRRAAVSADPLASLLEMCHSTQIGGVRMVDILRQNPTEEQAVDICKAAIGLRISSSFSFGGFTFKRTSGSSVKKEEEVLTGNLQTLKIRVHEGYEEFTMVGRRATAILRKATRRLIQLIVSGRDEQSIAEAIIVAMVFSQEDCMIKAVRGDLNFVNRANQRLNPMHQLLRHFQKDAKVLFQNWGIESIDNVMGMIGILPDMTPSTEMSLRGIRVSKMGVDEYSSTERVVVSIDRFLRVRDQRGNVLLSPEEVSETQGTEKLTITYSSSMMWEINGPESVLVNTYQWIIRNWEIVKIQWSQDPTMLYNKMEFEPFQSLVPKATRSRYSGFVRTLFQQMRDVLGTFDTVQIIKLLPFAAAPPEQSRMQFSSLTVNVRGSGLRILVRGNSPVFNYNKATKRLTVLGKDAGALTEDPDEGTSGVESAVLRGFLILGKEDKRYGPALSINELSNLAKGEKANVLIGQGDVVLVMKRKRDSSILTDSQTATKRIRMAIN*', 'PB2', '36'),
('1-2151', '1', 'MEDFVRQCFNPMIVELAEKAMKEYGEDPKIETNKFAAICTHLEVCFMYSDFHFIDERGESIIVESGDPNALLKHRFEIIEGRDRIMAWTVVNSICNTTGVEKPKFLPDLYDYKENRFIEIGVTRREVHIYYLEKANKIKSEKTHIHIFSFTGEEMATKADYTLDEESRARIKTRLFTIRQEMASRSLWDSFRQSERGEETIEEKFEITGTMRKLADQSLPPNFPSLENFRAYVDGFEPNGCIEGKLSQMSKEVNAKIEPFLRTTPRPLRLPDGPLCHQRSKFLLMDALKLSIEDPSHEGEGIPLYDAIKCMKTFFGWKEPNIVKPHEKGINPNYLMAWKQVLAELQDIENEEKIPRTKNMKRTSQLKWALGENMAPEKVDFDDCKDVGDLKQYDSDEPEPRSLASWVQNEFNKACELTDSSWIELDEIGEDVAPIEHIASMRRNYFTAEVSHCRATEYIMKGVYINTALLNASCAAMDDFQLIPMISKCRTKEGRRKTNLYGFIIKGRSHLRNDTDVVNFVSMEFSLTDPRLEPHKWEKYCVLEIGDMLLRTAIGQVSRPMFLYVRTNGTSKIKMKWGMEMRRCLLQSLQQIESMIEAESSVKEKDMTKEFFENKSETWPIGESPRGVEEGSIGKVCRTLLAKSVFNSLYASPQLEGFSAESRKLLLIVQALRDNLEPGTFDLGGLYEAIEECLINDPWVLLNASWFNSFLTHALK*', 'PA', '34'),
('1-1410', '1', 'MNPNQKIITIGSVCMTIGMANLILQIGNIISIWISHSIQLGNQNQIETCNQSVITYENNTWVNQTYVNISNTNFAAGQSVVSVKLAGNSSLCPVSGWAIYSKDNSVRIGSKGDVFVIREPFISCSPLECRTFFLTQGALLNDKHSNGTIKDRSPYRTLMSCPIGEVPSPYNSRFESVAWSASACHDGINWLTIGISGPDNGAVAVLKYNGIITDTIKSWRNNILRTQESECACVNGSCFTVMTDGPSNGQASYKIFRIEKGKIVKSVEMNAPNYHYEECSCYPDSSEITCVCRDNWHGSNRPWVSFNQNLEYQIGYICSGIFGDNPRPNDKTGSCGPVSSNGANGVKGFSFKYGNGVWIGRTKSISSRNGFEMIWDPNGWTGTDNNFSIKQDIVGINEWSGYSGSFVQHPELTGLDCIRPCFWVELIRGRPKENTIWTSGSSISFCGVNSDTVGWSWPDGAELPFTIDK*', 'NA', '31'),
('1-1497', '1', 'MASQGTKRSYEQMETGGERQDATEIRASVGRMIGGIGRFYIQMCTELKLSDYDGRLIQNSITIERMVLSAFDERRNKYLEEHPSAGKDPKKTGGPIYRRVDGKWMRELILYDKEEIRRVWRQANNGEDATAGLTHIMIWHSNLNDATYQRTRALVRTGMDPRMCSLMQGSTLPRRSGAAGAAVKGVGTIAMELIRMIKRGINDRNFWRGENGRRTRVAYERMCNILKGKFQTAAQRAMMDQVRESRNPGNAEIEDLIFLARSALILRGSVAHKSCLPACVYGLAVASGHDFEREGYSLVGIDPFKLLQNSQVVSLMRPNENPAHKSQLVWMACHSAAFEDLRVSSFIRGKKVIPRGKLSTRGVQIASNENVETMDSNTLELRSRYWAIRTRSGGNTNQQKASAGQISVQPTFSVQRNLPFERATVMAAFSGNNEGRTSDMRTEVIRMMESAKPEDLSFQGRGVFELSDEKATNPIVPSFDMSNEGSYFFGDNAEEYDS*', 'NP', '32'),
('6602-9265', '6602', 'MGCLGNQLLIALLLVSVLEICCVQYVTVFYGVPAWKNATIPLFCATRNRDTWGTTQCLPDNDDYSELAVNITEAFDAWNNTVTEQAIEDVWNLFETSIKPCVKLTPLCIAMRCNKTETDRWGLTGRAETTTTAKSTTSTTTTTVTPKVINEGDSCIKNNSCAGLEQEPMIGCKFNMTGLKRDKKIEYNETWYSRDLICEQPANGSESKCYMQHCNTSVIQESCDKHYWDAIRFRYCAPPGYALLRCNDSNYSGFAPKCSKVVVSSCTRMMETQTSTWFGFNGTRAENRTYIYWHGNSNRTIISLNKYYNLTMKCRRPGNKTVLPVTIMSGLVFHSQPINERPKQAWCRFGGNWSEAIQEVKETLVKHPRYTGTNDTRKINLTAPAGGDPEVTFMWTNCRGEFLYCKMNWFLNWVEDRDQNSNRWKQQKKPEQQKRNYVPCHIRQIINTWHKVGKNVYLPPREGDLTCNSTVTSLIAEIDWINNNETNITMSAEVAELYRLELGDYKLVEITPIGLAPTDVRRYTTTGASRNKRGVFVLGFLGFLATAGSAMGAASLTLSAQSRTLLAGIVQQQQQLLDVVKRQHELLRLTVWGTKNLQTRVTAIEKYLKDQAQLNSWGCAFRQVCHTTVPWPNDSLVPNWDNMTWQEWEGKVDFLEANITQLLEEAQIQQEKNMYELQKLNSWDIFGNWFDLTSWIRYIQYGVLIVLGVVGLRIVIYVVQMLARLRQGYRPVFSPPPAYVQQIPIHKDQEPPTKEGEEGEGGDRGGSRSWPWQIEYIHFLIRQLIRLLTWLFSSCRDWLLRIYQILQPVLQRLSRTLQRVREVIRIEITYLQYGWSYFQEAAQAWWKFARETLASAWRDIWETLGRVGRGILAIPRRVRQGLELALL*', 'Env', '16'),
('6155-6460', '6155', 'MAERPPEDEAPQREPWDEWVVEVLEEIKEEALKHFDPRLLTALGNYIYDRHGDTLEGAGELIRILQRALFIHFRSGCAHSRIGQSRGGNPLSTIPPSRAML*', 'Vpr', '16'),
('6297-6595;8825-8924', '6297', 'MIDMETPLKEQENSLESYREHSSSISEVDVPTPESANLEEEILSQLYRPLEPCYNKCYCKRCCYHCQHCFLKKGLGICYEQHRRRTPKKTKTNPLPASNNRSLSTRTRNRQPKKEKKEKVETEVAADLGLGR*', 'Tat', '16'),
('6532-6595;8825-9066', '6532', 'MSSTEEELRKRLRLIHFLHQTTDPYPQGPGTANQRRRRRRRWRQRWQQILALADRIYSFPNPPTDTPLDLAIQQLQGLAIEDLPDPPTSAPETLKDAAKSS*', 'Rev', '16'),
('5815-6153', '5815', 'MSDPRERIPPGNSGEETIEEAFEWLNRTVEGINRAAVNHLPRELIFQVWQRSWEYWHDEMGMSESYTKYRYLCLIQKALFMHCKKGCRCLGEGHGAGGWRTGPPPPPPPGLA*', 'Vpx', '16'),
('5343-5987', '5343', 'MEEEKNWIVVPTWRIPERLERWHSLIKHLKYNTKDLQMACYVPHHKVGWAWWTCSRVIFPLRDKTHLEVQGYWNLTPEKGWLSTHAVRITWYSRNFWTDVTPDCADTLLHSTYFPCFSEGEVQRAIRGEKLLSCCKFPKAHKNQVPSLQYLALTVVSHVRSQREDPTWKQWRGNNRRGLRMAKQNSRRNKQGSSKSPAEGANFPGLAKVLGILA*', 'Vif', '16'),
('2354-5413', '2354', 'KTGGFFRVWPMGKEAPQFPHGPDASGADTNCSPRGSSCGSTEELHEDGQKAEGEQRETLQGGDRGFAAPQFSLWRRPVVTAYIEEQPVEVLLDTGADDSIVTGIELGPNYTPKIVGGIGGFINTKEYKDVKIKVLGKVIKGTIMTGDTPINIFGRNLLTAMGMSLNFPIAKVEPIKVTLKPGKEGPKLRQWPLSKEKIIALREICEKMEKDGQLEEAPPTNPYNTPTFAIKKKDKNKWRMLIDFRELNKVTQDFTEVQLGIPHPAGLAKRRRITVLDVGDAYFSIPLDEEFRQYTAFTLPSVNNAEPGKRYIYKVLPQGWKGSPAIFQYTMRNVLEPFRKANPDVTLIQYMDDILIASDRTDLEHDRVVLQLKELLNGIGFSTPEEKFQKDPPFQWMGYELWPTKWKLQKIELPQRETWTVNDIQKLVGVLNWAAQIYPGIKTKHLCRLIRGKMTLTEEVQWTEMAEAEYEENKIILSQEQEGCYYQEGKPIEATVIKSQDNQWSYKIHQEDKVLKVGKFAKVKNTHTNGVRLLAHVVQKIGKEALVIWGEVPKFHLPVEREIWEQWWTDYWQVTWIPDWDFVSTPPLVRLVFNLVKEPIQGAETFYVDGSCNRQSREGKAGYVTDRGRDKAKLLEQTTNQQAELEAFYLALADSGPKANIIVDSQYVMGIVAGQPTESESRLVNQIIEEMIKKEAIYVAWVPAHKGIGGNQEVDHLVSQGIRQVLFLEKIEPAQEEHEKYHSNVKELVFKFGIPRLVAKQIVDTCDRCHQKGEAIHGQVNAELGTWQMDCTHLEGKIIIVAVHVASGFIEAEVIPQETGRQTALFLLKLAGRWPITHLHTDNGANFTSQEVKMVAWWAGIEQTFGVPYNPQSQGVVEAMNHHLKTQIDRIREQANSVETIVLMAVHCMNFKRRGGIGDMTPAERLVNMITTEQEIQFQQSKNSKFKNFRVYYREGRDQLWRGPGELLWKGEGAVILKVGTEIKVVPRRKAKIIKDYGGGKELDSGSHLEDTGEAREVA*', 'Pol', '16'),
('1065-2588', '1065', 'MGARNSVLSGKKADELEKIRLRPNGKKKYMLKHVVWAANELDRFGLAESLLDNKEGCQKILSVLAPLVPTGSENLKSLYNTVCVIWCIHAEEKVKHTEEAKQIVQRHLVVETGTADKMPATSRPTAPPSGRGGNYPVQQVGGNYVHLPLSPRTLNAWVKLVEEKKFGAEVVPGFQALSEGCTPYDINQMLNCVGEHQAAMQIIREIINEEAADWDLQHPQPGPLPAGQLREPRGSDIAGTTSTVEEQIQWMYRQQNPIPVGNIYRRWIQLGLQKCVRMYNPTNILDVKQGPKEPFQSYVDRFYKSLRAEQTDPAVKNWMTQTLLIQNANPDCKLVLKGLGMNPTLEEMLTACQGIGGPGQKARLMAEALKEALRPDQLPFAAVQQKGQRRTIKCWNCGKEGHSARQCRAPRRQGCWGCGKTGHVMAKCPERQAGFLGFGPWGKKPRNFPMAQMPQGLTPTAPPEDPAVDLLKNYMKMGRKQRENRERPYKEVTEDLLHLNSLFGEDQ*', 'Gag', '16'),
('5462-5751;7984-8083', '5462', 'METPLKEQESSLESSREHSSSISEVDATTPESATLEEEILSQLYRPLEACYNKCYCKKCCYHCQHCFLKKGLGXCYEQQRRRTPKKTKANTFSASNNRSLSRRARNRQPKKEKKKTVEAEVATDLGLGR*', 'Tat', '17'),
('4971-5309', '4971', 'MSDPRERIPPGNSGEETVGEAFDWLERTVEEINRAAVNHLPRELIFQVWRRSWEYWHDEIGMSASYTKYRYLCLIQKALFMHCKKGCRCLGGEHGAGGWRSGPPPPPPPGLA*', 'Vpx', '17'),
('5311-5616', '5311', 'MTERPPEDEAPQREPWDEWVVEVLEEVKEEALKHFDPRLLTALGNYIYDRHGDTLEGAGELIRILQRALFIHFRGGCNHSRIGHSGGGNPLSTIPPSRGVL*', 'Vpr', '17'),
('4499-5143', '4499', 'MEEEKSWIAVXTWRIPGRLEKWHSLIKHLKYNTKDLQKACYVPHHKVGWAWWTCSRVIFPLRDESHLEVQGYWSLTPEXXWLSTYAXXITWYSRNFWTDVTPDXADTLLHGTYFPCFSEGEVRRAIRGEKLLSCCKFPKAHKNQVPSLQYLALTVVSHVRSQGEDPTWKQWRGNSRRGLRLARKNSRRNKQGSSESFAEGVNFPGLAKVLGILA*', 'Vif', '17'),
('8258-9043', '8258', 'MGGVTSKKQRKHGGNLRERLLQARGETYGRLWDGLEGEYSQSQDVSGKGLSSLSCEP:::::::::::::RNPTAERAKLDYRQQNMDDVDDDX:XXFPVTPRVPLRTMTYKLAIDMSHFIKEKGGLEGIYYSDRRHRILNLYLEKEEGIIPDWQNYTAGPGIRYPMCFGWLWKLVPVDVSDEAQEDEAHCLMHPAQTSQWDDPWGEVLAWKFDPELAYNYMAFVKHPEEFGSRSGLSEEEVKRRLTARGLLKMADKKETS*', 'Nef', '17'),
('1501-4569', '1501', 'MPRETGGFFRAWPMGKEAPQFPHGPDTSGVDTNCSPRGSSCGSTEELHEDGQKAEGXQRETLQGXDGGFAAPQFSLWRRPVVTAYIEEQPVEVLLDTGADDSXVAGIELGPNYTPKIVGXIGGFINTKEYKDVKIKVLGXVIKGTIMTGDTPINIFGRNLLTAMGMSLNLPIAKVEPIKVTLKPGKDGPKLRQWPLSKEKIIALXEICEKMEKDGQLEEAPPTNPYNTPTFAIKKKDKNKWRMLIDFRELNKVTQDFTEVQXGIPHPAGLAKRRRITVLDVGDAYFSIPLDEEFRQYTAFTLPSVNNAEPGKRYIYKVXPQGWKGSPAIFQHXMRNVLEPFRKANPDVXLIQYMDXILIASXRTDLEHDRVVLQLKELLNSMGFSTPEEKFQKDPPFQWMGYELWPTKWKLQKIELPQRETWTVNDIQXLVGVLNWAAQIYPGIKTKHLCRLIRGKMTLTEEVQWTEMAEAEYEEXKIILSQEQEGCYYQEGKPLEATVIKSQDNQWSYKIHQEDKILKVGKFAKIKNTHTNGVRLLAXVVQKIGKEAIVIWGQVPKFHLPVEREIWEQWWTDYWQVTWIPEWDFVSTPPLVRXVFNLVKEPIQGAETFYVDGSCNRQSKEGKAGYVTDRXRDRTKXLEQTTNQQAXLEAFYLALADSGPXANIIXDSQYVMGIIAGQPXESESRLVNQIIEEMIKKEAIYVXWVPAHKGIGGNQEVDHLXSQGIRQVLFLEKIEPAQEEHEKYHSNVKXLVFKFGLPRLVAKQIVDTCDKCHQKGEAIHGQVNAELGTWQMDCTHLEGKIIIVAVHVASGFIEAEVIPQETGRQTALFLLKLASRWPITHLHTDNGANFTSQEVKMVAWWAXIEQTFGVPYNPQSXGVVEAMNHHLKTQIDRIREQANSIETIVLMAXHCMNFKRRGGIGDMTPAERLVNMITTEQEIQFQQSKNSKFKNFRVYYREGRDQLWKGPGELLWKGEGAVILKVGTEIKVVPRRKAKIIKDYGGGKELDSGSXLEDTGEAREVA*', 'Pol', '17'),
('5758-8424', '5758', 'MGCLGNQLLIALLLLSALGISCVQYVTVFYGIPAWKNATVPLFCATENRDTWGTTQCLPDNNDYSELAINVTEAFDAWDNTVTEQAIEDVWNLFETSIKPCVKLTPLCIAMRCNKTETDRWGLTGKPVTTTTSTTTKSTSKPPALTAKVINENDPCIXTDNCAGLEQEPMISCKFNMTGLXRDKKKEYNETWYSRDIVCEQNNNGNENESKCYMNHCNTSVIQESCDKHYWDAIRFRYCAPPGYALLRCNDSNYSGFEPNCTKVVVSSCTRMMETQTSTWFGFNGTRAENRTYIYWHGRSNRTIISLNKYYNLTMSCRRPGKKIVLPVTITSGLIFHSQTINKRPKQAWCWFXGXWKGXIREVKETLVKHPRYTGTNDTXXINLTAPXGGDXEVTFMWTNCRGEFLYCKMNWFLNWVDETNGFRW::QXXKEKKRRNYVPCHIRQVIXTWHXVGKNVYLPPREGXXTCNSTVTSLIAEIDWIDKNETNITMSAEVAELYRLELGDYKLVEITPIGLAPTSXRRYTTTGASRNKRGVFVLGFLGFLXTAGSAMGAASLTLSAQSRTLLAGIVQQQQQLLDVVKRQQELLRLTVWGTKNLQTRVTAIEKYLKDQAHLNSWGCAFRQVCHTTVPWPNDTLMPNWDNMTWQEWERQVDFLEANITQLLEEAQIQQEENMYELQKLNSWDIFGNWFDLTSWIKYIQYGVLIVLGVIGLRIVIYVVQMLARLRQGYRPVFSSPPVYVQQIPIQKGQEPPTKEGEEEDGGGRGGNRSWPWQIEYIHFLIRQLIRLLTWLFNSCRDWLLRSCQILQPVLQSLSRTLQRVREVIRVEIAYLQYGWRYFQEAAQAWWKFARETLASAWRDLWETLGRVGRGILAIPRRIRQGLELTLL*', 'Env', '17'),
('536-2068', '536', 'MGVRNSVLSGKKADELEKIRLRPNGKKKYMLKHVVWAANELDRFGLAESLLENKEGCQKILSVLAPLVPTGSENLKSLYNTVCVIWCIHAEEKVKHTEEAKQIVQRHLVVETGTTETMPKTSRPTAPSSGRGGNYPVQQIGGNYVHLPLSPRTLNAWVKLIEEKKFGAEVVPGFQALSEGCTPYDINQMLNCVGDHQAAMQIIRDIINEEAADWDLQHPQPAPQQGQLREPSGSDIAGTTSSVDEQIQWMYRQQNPIPVGNIYRRWIQLGLQKCVRMYNPTNILDVKQGPKEPFQSYVDRFYKSLRAEQTDAAVKNWMTQTLLIQNANPDCKLVLKGLGVNPTLEEMLTACQGVGGPGQKARLMAEALKEALAPVPIPFAAAQQRGPRKPIKCWNCGKEGHSARQCRAPRRQGCWKCGKMDHVMAKCPDRQAGFLGLGPWGKKPRNFPMAQVHQGLMPTAPPEDPAVDLLKNYMQLGKQQREKQRESREKPYKEVTEDLLHLNSLFGGDQ*', 'Gag', '37'),
('1714-4893', '1714', 'LELWERGTLCKAMQSPKKTGMLEMWKNGPCYGQMPRQTGGFFRPWSMGKEAPQFPHGSSASGADANCSPRGPSCGSAKELHAVGQAAERKAERKQREALQGGDRGFAAPQFSLWRRPVVTAHIEGQPVEVLLDTGADDSIVTGIELGPHYTPKIVGGIGGFINTKEYKNVEIEVLGKRIKGTIMTGDTPINIFGRNLLTALGMSLNFPIAKVEPVKVALKPGKDGPKLKQWPLSKEKIVALREICEKMEKDGQLEEAPPTNPYNTPTFAIKKKDKNKWRMLIDFRELNRVTQDFTEVQLGIPHPAGLAKRKRITVLDIGDAYFSIPLDEEFRQYTAFTLPSVNNAEPGKRYIYKVLPQGWKGSPAIFQYTMRHVLEPFRKANPDVTLVQYMDDILIASDRTDLEHDRVVLQSKELLNSIGFSTPEEKFQKDPPFQWMGYELWPTKWKLQKIELPQRETWTVNDIQKLVGVLNWAAQIYPGIKTKHLCRLIRGKMTLTEEVQWTEMAEAEYEENKIILSQEQEGCYYQEGKPLEATVIKSQDNQWSYKIHQEDKILKVGKFAKIKNTHTNGVRLLAHVIQKIGKEAIVIWGQVPKFHLPVEKDVWEQWWTDYWQVTWIPEWDFISTPPLVRLVFNLVKDPIEGEETYYTDGSCNKQSKEGKAGYITDRGKDKVKVLEQTTNQQAELEAFLMALTDSGPKANIIVDSQYVMGIITGCPTESESRLVNQIIEEMIKKSEIYVAWVPAHKGIGGNQEIDHLVSQGIRQVLFLEKIEPAQEEHDKYHSNVKELVFKFGLPRIVARQIVDTCDKCHQKGEAIHGQANSDLGTWQMDCTHLEGKIIIVAVHVASGFIEAEVIPQETGRQTALFLLKLAGRWPITHLHTDNGANFASQEVKMVAWWAGIEHTFGVPYNPQSQGVVEAMNHHLKNQIDRIREQANSVETIVLMAVHCMNFKRRGGIGDMTPAERLINMITTEQEIQFQQSKNSKFKNFRVYYREGRDQLWKGPGELLWKGEGAVILKVGTDIKVVPRRKAKIIKDYGGGKEVDSSSHMEDTGEAREVA*', 'Pol', '37'),
('4823-5467', '4823', 'MEEEKRWIAVPTWRIPERLERWHSLIKYLKYKTKDLQKVCYVPHFKVGWAWWTCSRVIFPLQEGSHLEVQGYWHLTPEKGWLSTYAVRITWYSKNFWTDVTPNYADILLHSTYFPCFTAGEVRRAIRGEQLLSCCRFPRAHKYQVPSLQYLALKVVSDVRSQGENPTWKQWRRDNRRGLRMAKQNSRGDKQRGGKPPTKGANFPGLAKVLGILA*', 'Vif', '37'),
('5295-5633', '5295', 'MSDPRERIPPGNSGEETIGEAFEWLNRTVEEINREAVNHLPRELIFQVWQRSWEYWHDEQGMSPSYVKYRYLCLIQKALFMHCKKGCRCLGEGHGAGGWRPGPPPPPPPGLA*', 'vpX', '37'),
('5634-5945', '5634', 'MEERPPENEGPQREPWDEWVVEVLEELKEEALKHFDPRLLTALGNHIYNRHGDTLEGAGELIRILQRALFMHFRGGCIHSRIGQPGGGNPLSAIPPSRSMRML*', 'vpR', '37'),
('5954-6168;8463-8508', '5954', 'MEPVDPRLEPWKHPGSRPKTACTNCYCKKCCFHCQVCFITKALGISYGRKKRRQRRRAHQNSQTHQASLSKQPTSHFRGEPTGPKE*', 'Tat', '37'),
('6093-6168;8463-8737', '6093', 'MAGRSGDSDEELIRTVRLIKLLYQSNPPPTSEGSRQARRNRRRRWRERQRQIHSISDRILSTYLGRSAEPVPLQLPPLERLTLDCNEDCGTPGTQRVGSPQILVESPTVLESGTKE*', 'Rev', '37'),
('6185-6430', '6185', 'MQSIQIEIVALVVAIIIAIVVWSIVIIEYRKILRQRKIDRLINRLIERAEDSGNESEGEISALVEMGVEMGHHAPWDVDDL*', 'vpu', '37'),
('6345-8948', '6345', 'MRVKEKYQHLWRWGWRWGIMLLGMLMICSATEKLWVTVYYGVPVWKEAKTTLFCASNAKAYEKEVHNIWATHACVPTDPNPQEIVLGNVTENFNMWKNDMVDQMHEDIISLWDQSLKPCVKLTSLCVTLKCSNFTGKSNVTYKGDMEVKNCSFNVTTEIRDKKQKVYALFYRLDITPLDDNSSEYILINCNSSTITQACPKVNFDPIPIHYCAPAGYAILKCNNKTFNGTGPCHNVSTVQCTHGIKPVVSTQLLLNGSLAEGEIIIRSENLTDNVKTIIVHFNESVEITCTRPNNNTRKSISIGPGQAIYATGDIIGDIRQAHCNISKENWNKTLQWVRGKLKEHFPNKTIVFKPSSGGDLEITTHSFNCRGEFFYCNTSKLFNSTDNSTHMGTENNTIITIPCRIKQIINMWQEVGRAMYAPPIEGNITCKSNITGLLLVRDGGWDNSTNDTETFRPGGGDMRDNWRSELYKYKVVEVKPLGIAPTKAKRRVVEREKRAVGIGAVFLGFLGAAGSTMGAASITLTVQARQLLSGIVQQQDNLLRAIEAQQHMLQLTVWGIKQLQARVLAIERYLQDQQLLGIWGCSGKLICTTAVPWNDSWSNKSQTDIWENMTWMQWDREISRHTDTIYRLLEDSQNQQEKNEKDLLALDSWKNLWNWFSITRWLWYIKIFIMIVGGLIGLRIIFAVLSIVNRVRQGYSPLSFQTHLPLPRGADRPEGIEEEGGERDRDRSIRLVTGSLALIWDDLRSLCLFSYHRLRDLLLIVTRTVELLGRRGWEALKYWWNLLLYWSQELKNSAVSLLNATAIAVRQYGWSYFHEAVQAVWRSATETLAGAWGDLWEILRRGGRWILAIPRRIRQGLELTLL*', 'Env', '37'),
('8782-9573', '8782', 'MGGAISMRRSRPSGDLRQRLLRARGETYGRFLGEVEDGYSQSPGGLDKGSSSLSCEGQKYNQGQHMNTPWRNPAEEGEKLAYRKQNMDDIDEEDDDLVGVSVRPKVLLRTMSYKLAIDMSHFIKEKGGLEGIYYSARRHRILDIYLEKEEGIIPDWQDYTSGPGIRYPKTFGWLWKLVPVDVSDEAQEDEEHYLMHPAQTSQWDDPWGEVLAWKFDPTLAYTYEAYVRYPEEFGSKSGLSEEEVRRRLTARGLLNMADKKETR*', 'Nef', '37'),
('6912-7121', '6912', 'MGSIVLYMSQSFMVYQLGGMRQFPSFVQPRIGILGEQLSAYQIMVIIQKWPLMLQKALMPGIIQSQNRQ*', 'Env ARF 1', '1'),
('6784-7005', '6784', 'MSNHEREEELRKRLRLIHLLHQTSKYGMSWESAAYRHLAFKCLWDLLYSICHSLLWCTSLEECDNSPLLCNQE*', 'Env ARF 10', '1'),
('1-660', '1', 'MDSNTMSSFQVDCFLWHIRKRFADNGLGDAPFLDRLRRDQKSLKGRGNTLGLDIETATLVGKQIVEWILKEESSETLRMTIASVPTSRYLSDMTLEEMSRDWFMLMPRQKIIGPLCVRLDQAIMEKNIVLKANFSVIFNRLETLILLRAFTEEGAIVGEISPLPSLPGHTYEDVKNAVGVLIGGLEWNGNTVRVSENIQRFAWRNCDENGRPSLPPEQK*', 'NS1', '33'),
('1-366', '1', 'MDSNTMSSFQDILMRMSKMQLGSSSEDLNGMVTRFESLKIYRDSLGETVMRMGDLHYLQSRNEKWREQLGQKFEEIRWLIEEMRHRLKATENSFEQITFMQALQLLLEVEQEIRAFSFQLI*', 'NS2', '33'),
('1-759', '1', 'MSLLTEVETYVLSIIPSGPLKAEIAQRLESVFAGKNTDLEALMEWLKTRPILSPLTKGILGFVFTLTVPSERGLQRRRFVQNALNGNGDPNNMDRAVKLYKKLKREITFHGAKEVSLSYSTGALASCMGLIYNRMGTVTTEAAFGLVCATCEQIADSQHRSHRQMATTTNPLIRHENRMVLASTTAKAMEQMAGSSEQAAEAMEVANQTRQMVHAMRTIGTHPSSSAGLKDDLLENLQAYQKRMGVQMQRFK*', 'M1', '30'),
('1-294', '1', 'MSLLTEVETPTRSEWECRCSDSSDPLVIAANIIGILHLILWITDRLFFKCIYRRFKYGLKRGPSTEGVPESMREEYQQEQQSAVDVDDGHFVNIELE*', 'M2', '30')
;
-- ----------------------------
-- Table structure for sequenceanalysis.drug_resistance
-- ----------------------------
CREATE TABLE sequenceanalysis.drug_resistance
(
RowId serial NOT NULL,
--virus_strain VARCHAR(45) NOT NULL,
ref_nt_id INTEGER NOT NULL,
class VARCHAR(45) DEFAULT NULL,
--protein VARCHAR(45) NOT NULL,
ref_aa_id INTEGER NOT NULL,
aa_position INTEGER NOT NULL,
aa_insert_index INTEGER NOT NULL,
reference_aa VARCHAR(2) NOT NULL,
mutant_aa VARCHAR(2) NOT NULL,
drug VARCHAR(45) NOT NULL,
--Container ENTITYID NOT NULL,
CreatedBy USERID,
Created TIMESTAMP,
ModifiedBy USERID,
Modified TIMESTAMP,
CONSTRAINT PK_drug_resistance PRIMARY KEY (rowId)
--NOTE: depreciated
-- CONSTRAINT fk_drug_resistance_ref_nt_id FOREIGN KEY (ref_nt_id)
-- REFERENCES sequenceanalysis.ref_nt_sequences (rowid) MATCH SIMPLE
-- ON UPDATE NO ACTION ON DELETE NO ACTION,
-- CONSTRAINT fk_drug_resistance_ref_aa_id FOREIGN KEY (ref_aa_id)
-- REFERENCES sequenceanalysis.ref_aa_sequences (rowid) MATCH SIMPLE
-- ON UPDATE NO ACTION ON DELETE NO ACTION
)
WITH (OIDS=FALSE);
-- ----------------------------
-- Records of virus_resistance
-- ----------------------------
INSERT INTO sequenceanalysis.drug_resistance
(ref_nt_id, ref_aa_id, class, aa_position, aa_insert_index, reference_aa, mutant_aa, drug)
VALUES
('5', '104', 'Protease', '23', '0', 'L', 'I', 'NFV'),
('5', '104', 'Protease', '24', '0', 'L', 'I', 'ATV'),
('5', '104', 'Protease', '24', '0', 'L', 'I', 'FPV'),
('5', '104', 'Protease', '24', '0', 'L', 'I', 'IDV'),
('5', '104', 'Protease', '24', '0', 'L', 'I', 'LPV'),
('5', '104', 'Protease', '24', '0', 'L', 'I', 'NFV'),
('5', '104', 'Protease', '24', '0', 'L', 'I', 'SQV'),
('5', '104', 'Protease', '30', '0', 'D', 'N', 'NFV'),
('5', '104', 'Protease', '32', '0', 'V', 'I', 'DRV'),
('5', '104', 'Protease', '32', '0', 'V', 'I', 'FPV'),
('5', '104', 'Protease', '32', '0', 'V', 'I', 'IDV'),
('5', '104', 'Protease', '32', '0', 'V', 'I', 'LPV'),
('5', '104', 'Protease', '32', '0', 'V', 'I', 'TPV'),
('5', '104', 'Protease', '33', '0', 'L', 'F', 'ATV'),
('5', '104', 'Protease', '33', '0', 'L', 'F', 'DRV'),
('5', '104', 'Protease', '33', '0', 'L', 'F', 'FPV'),
('5', '104', 'Protease', '33', '0', 'L', 'F', 'LPV'),
('5', '104', 'Protease', '33', '0', 'L', 'F', 'NFV'),
('5', '104', 'Protease', '33', '0', 'L', 'F', 'TPV'),
('5', '104', 'Protease', '46', '0', 'M', 'I', 'ATV'),
('5', '104', 'Protease', '46', '0', 'M', 'I', 'FPV'),
('5', '104', 'Protease', '46', '0', 'M', 'I', 'IDV'),
('5', '104', 'Protease', '46', '0', 'M', 'I', 'LPV'),
('5', '104', 'Protease', '46', '0', 'M', 'I', 'NFV'),
('5', '104', 'Protease', '46', '0', 'M', 'I', 'TPV'),
('5', '104', 'Protease', '46', '0', 'M', 'L', 'ATV'),
('5', '104', 'Protease', '46', '0', 'M', 'L', 'FPV'),
('5', '104', 'Protease', '46', '0', 'M', 'L', 'IDV'),
('5', '104', 'Protease', '46', '0', 'M', 'L', 'LPV'),
('5', '104', 'Protease', '46', '0', 'M', 'L', 'NFV'),
('5', '104', 'Protease', '46', '0', 'M', 'L', 'TPV'),
('5', '104', 'Protease', '47', '0', 'I', 'V', 'ATV'),
('5', '104', 'Protease', '47', '0', 'I', 'V', 'DRV'),
('5', '104', 'Protease', '47', '0', 'I', 'V', 'FPV'),
('5', '104', 'Protease', '47', '0', 'I', 'V', 'IDV'),
('5', '104', 'Protease', '47', '0', 'I', 'V', 'LPV'),
('5', '104', 'Protease', '47', '0', 'I', 'V', 'NFV'),
('5', '104', 'Protease', '47', '0', 'I', 'V', 'TPV'),
('5', '104', 'Protease', '47', '0', 'I', 'A', 'DRV'),
('5', '104', 'Protease', '47', '0', 'I', 'A', 'FPV'),
('5', '104', 'Protease', '47', '0', 'I', 'A', 'LPV'),
('5', '104', 'Protease', '48', '0', 'G', 'V', 'ATV'),
('5', '104', 'Protease', '48', '0', 'G', 'V', 'LPV'),
('5', '104', 'Protease', '48', '0', 'G', 'V', 'NFV'),
('5', '104', 'Protease', '48', '0', 'G', 'V', 'SQV'),
('5', '104', 'Protease', '48', '0', 'G', 'M', 'ATV'),
('5', '104', 'Protease', '48', '0', 'G', 'M', 'LPV'),
('5', '104', 'Protease', '48', '0', 'G', 'M', 'NFV'),
('5', '104', 'Protease', '48', '0', 'G', 'M', 'SQV'),
('5', '104', 'Protease', '50', '0', 'I', 'L', 'ATV'),
('5', '104', 'Protease', '50', '0', 'I', 'V', 'DRV'),
('5', '104', 'Protease', '50', '0', 'I', 'V', 'FPV'),
('5', '104', 'Protease', '50', '0', 'I', 'V', 'LPV'),
('5', '104', 'Protease', '53', '0', 'F', 'L', 'ATV'),
('5', '104', 'Protease', '53', '0', 'F', 'L', 'IDV'),
('5', '104', 'Protease', '53', '0', 'F', 'L', 'NFV'),
('5', '104', 'Protease', '53', '0', 'F', 'L', 'SQV'),
('5', '104', 'Protease', '54', '0', 'I', 'V', 'ATV'),
('5', '104', 'Protease', '54', '0', 'I', 'V', 'FPV'),
('5', '104', 'Protease', '54', '0', 'I', 'V', 'IDV'),
('5', '104', 'Protease', '54', '0', 'I', 'V', 'LPV'),
('5', '104', 'Protease', '54', '0', 'I', 'V', 'NFV'),
('5', '104', 'Protease', '54', '0', 'I', 'V', 'SQV'),
('5', '104', 'Protease', '54', '0', 'I', 'V', 'TPV'),
('5', '104', 'Protease', '54', '0', 'I', 'T', 'ATV'),
('5', '104', 'Protease', '54', '0', 'I', 'T', 'FPV'),
('5', '104', 'Protease', '54', '0', 'I', 'T', 'IDV'),
('5', '104', 'Protease', '54', '0', 'I', 'T', 'LPV'),
('5', '104', 'Protease', '54', '0', 'I', 'T', 'NFV'),
('5', '104', 'Protease', '54', '0', 'I', 'T', 'SQV'),
('5', '104', 'Protease', '54', '0', 'I', 'A', 'ATV'),
('5', '104', 'Protease', '54', '0', 'I', 'A', 'FPV'),
('5', '104', 'Protease', '54', '0', 'I', 'A', 'IDV'),
('5', '104', 'Protease', '54', '0', 'I', 'A', 'LPV'),
('5', '104', 'Protease', '54', '0', 'I', 'A', 'NFV'),
('5', '104', 'Protease', '54', '0', 'I', 'A', 'SQV'),
('5', '104', 'Protease', '54', '0', 'I', 'A', 'TPV'),
('5', '104', 'Protease', '54', '0', 'I', 'L', 'ATV'),
('5', '104', 'Protease', '54', '0', 'I', 'L', 'FPV'),
('5', '104', 'Protease', '54', '0', 'I', 'L', 'IDV'),
('5', '104', 'Protease', '54', '0', 'I', 'L', 'LPV'),
('5', '104', 'Protease', '54', '0', 'I', 'L', 'NFV'),
('5', '104', 'Protease', '54', '0', 'I', 'L', 'SQV'),
('5', '104', 'Protease', '54', '0', 'I', 'L', 'DRV'),
('5', '104', 'Protease', '54', '0', 'I', 'M', 'ATV'),
('5', '104', 'Protease', '54', '0', 'I', 'M', 'FPV'),
('5', '104', 'Protease', '54', '0', 'I', 'M', 'IDV'),
('5', '104', 'Protease', '54', '0', 'I', 'M', 'LPV'),
('5', '104', 'Protease', '54', '0', 'I', 'M', 'NFV'),
('5', '104', 'Protease', '54', '0', 'I', 'M', 'SQV'),
('5', '104', 'Protease', '54', '0', 'I', 'M', 'DRV'),
('5', '104', 'Protease', '54', '0', 'I', 'M', 'TPV'),
('5', '104', 'Protease', '73', '0', 'G', 'S', 'ATV'),
('5', '104', 'Protease', '73', '0', 'G', 'S', 'DRV'),
('5', '104', 'Protease', '73', '0', 'G', 'S', 'FPV'),
('5', '104', 'Protease', '73', '0', 'G', 'S', 'IDV'),
('5', '104', 'Protease', '73', '0', 'G', 'S', 'NFV'),
('5', '104', 'Protease', '73', '0', 'G', 'S', 'SQV'),
('5', '104', 'Protease', '73', '0', 'G', 'T', 'ATV'),
('5', '104', 'Protease', '73', '0', 'G', 'T', 'DRV'),
('5', '104', 'Protease', '73', '0', 'G', 'T', 'FPV'),
('5', '104', 'Protease', '73', '0', 'G', 'T', 'IDV'),
('5', '104', 'Protease', '73', '0', 'G', 'T', 'NFV'),
('5', '104', 'Protease', '73', '0', 'G', 'T', 'SQV'),
('5', '104', 'Protease', '76', '0', 'L', 'V', 'DRV'),
('5', '104', 'Protease', '76', '0', 'L', 'V', 'FPV'),
('5', '104', 'Protease', '76', '0', 'L', 'V', 'IDV'),
('5', '104', 'Protease', '76', '0', 'L', 'V', 'LPV'),
('5', '104', 'Protease', '82', '0', 'V', 'A', 'ATV'),
('5', '104', 'Protease', '82', '0', 'V', 'A', 'FPV'),
('5', '104', 'Protease', '82', '0', 'V', 'A', 'IDV'),
('5', '104', 'Protease', '82', '0', 'V', 'A', 'LPV'),
('5', '104', 'Protease', '82', '0', 'V', 'A', 'NFV'),
('5', '104', 'Protease', '82', '0', 'V', 'A', 'TPV'),
('5', '104', 'Protease', '82', '0', 'V', 'A', 'SQV'),
('5', '104', 'Protease', '82', '0', 'V', 'T', 'ATV'),
('5', '104', 'Protease', '82', '0', 'V', 'T', 'FPV'),
('5', '104', 'Protease', '82', '0', 'V', 'T', 'IDV'),
('5', '104', 'Protease', '82', '0', 'V', 'T', 'LPV'),
('5', '104', 'Protease', '82', '0', 'V', 'T', 'NFV'),
('5', '104', 'Protease', '82', '0', 'V', 'T', 'TPV'),
('5', '104', 'Protease', '82', '0', 'V', 'T', 'SQV'),
('5', '104', 'Protease', '82', '0', 'V', 'F', 'ATV'),
('5', '104', 'Protease', '82', '0', 'V', 'F', 'FPV'),
('5', '104', 'Protease', '82', '0', 'V', 'F', 'IDV'),
('5', '104', 'Protease', '82', '0', 'V', 'F', 'LPV'),
('5', '104', 'Protease', '82', '0', 'V', 'F', 'NFV'),
('5', '104', 'Protease', '82', '0', 'V', 'F', 'TPV'),
('5', '104', 'Protease', '82', '0', 'V', 'S', 'ATV'),
('5', '104', 'Protease', '82', '0', 'V', 'S', 'FPV'),
('5', '104', 'Protease', '82', '0', 'V', 'S', 'IDV'),
('5', '104', 'Protease', '82', '0', 'V', 'S', 'LPV'),
('5', '104', 'Protease', '82', '0', 'V', 'S', 'NFV'),
('5', '104', 'Protease', '82', '0', 'V', 'S', 'TPV'),
('5', '104', 'Protease', '82', '0', 'V', 'L', 'TPV'),
('5', '104', 'Protease', '84', '0', 'I', 'V', 'ATV'),
('5', '104', 'Protease', '84', '0', 'I', 'V', 'DRV'),
('5', '104', 'Protease', '84', '0', 'I', 'V', 'FPV'),
('5', '104', 'Protease', '84', '0', 'I', 'V', 'IDV'),
('5', '104', 'Protease', '84', '0', 'I', 'V', 'LPV'),
('5', '104', 'Protease', '84', '0', 'I', 'V', 'NFV'),
('5', '104', 'Protease', '84', '0', 'I', 'V', 'SQV'),
('5', '104', 'Protease', '84', '0', 'I', 'V', 'TPV'),
('5', '104', 'Protease', '84', '0', 'I', 'A', 'ATV'),
('5', '104', 'Protease', '84', '0', 'I', 'A', 'DRV'),
('5', '104', 'Protease', '84', '0', 'I', 'A', 'FPV'),
('5', '104', 'Protease', '84', '0', 'I', 'A', 'IDV'),
('5', '104', 'Protease', '84', '0', 'I', 'A', 'LPV'),
('5', '104', 'Protease', '84', '0', 'I', 'A', 'NFV'),
('5', '104', 'Protease', '84', '0', 'I', 'A', 'SQV'),
('5', '104', 'Protease', '84', '0', 'I', 'A', 'TPV'),
('5', '104', 'Protease', '84', '0', 'I', 'C', 'ATV'),
('5', '104', 'Protease', '84', '0', 'I', 'C', 'DRV'),
('5', '104', 'Protease', '84', '0', 'I', 'C', 'FPV'),
('5', '104', 'Protease', '84', '0', 'I', 'C', 'IDV'),
('5', '104', 'Protease', '84', '0', 'I', 'C', 'LPV'),
('5', '104', 'Protease', '84', '0', 'I', 'C', 'NFV'),
('5', '104', 'Protease', '84', '0', 'I', 'C', 'SQV'),
('5', '104', 'Protease', '84', '0', 'I', 'C', 'TPV'),
('5', '104', 'Protease', '88', '0', 'N', 'D', 'ATV'),
('5', '104', 'Protease', '88', '0', 'N', 'D', 'NFV'),
('5', '104', 'Protease', '88', '0', 'N', 'S', 'ATV'),
('5', '104', 'Protease', '88', '0', 'N', 'S', 'IDV'),
('5', '104', 'Protease', '88', '0', 'N', 'S', 'NFV'),
('5', '104', 'Protease', '88', '0', 'N', 'S', 'SQV'),
('5', '104', 'Protease', '90', '0', 'L', 'M', 'ATV'),
('5', '104', 'Protease', '90', '0', 'L', 'M', 'DRV'),
('5', '104', 'Protease', '90', '0', 'L', 'M', 'FPV'),
('5', '104', 'Protease', '90', '0', 'L', 'M', 'IDV'),
('5', '104', 'Protease', '90', '0', 'L', 'M', 'LPV'),
('5', '104', 'Protease', '90', '0', 'L', 'M', 'NFV'),
('5', '104', 'Protease', '90', '0', 'L', 'M', 'SQV'),
('5', '104', 'Protease', '90', '0', 'L', 'M', 'TPV'),
('5', '105', 'NRTI', '184', '0', 'M', 'V', '3TC'),
('5', '105', 'NRTI', '184', '0', 'M', 'V', 'FTC'),
('5', '105', 'NRTI', '184', '0', 'M', 'V', 'ABC'),
('5', '105', 'NRTI', '184', '0', 'M', 'V', 'DDI'),
('5', '105', 'NRTI', '184', '0', 'M', 'I', '3TC'),
('5', '105', 'NRTI', '184', '0', 'M', 'I', 'FTC'),
('5', '105', 'NRTI', '184', '0', 'M', 'I', 'ABC'),
('5', '105', 'NRTI', '184', '0', 'M', 'I', 'DDI'),
('5', '105', 'NRTI', '41', '0', 'M', 'L', 'ABC'),
('5', '105', 'NRTI', '41', '0', 'M', 'L', 'DDI'),
('5', '105', 'NRTI', '41', '0', 'M', 'L', 'TDF'),
('5', '105', 'NRTI', '41', '0', 'M', 'L', 'D4T'),
('5', '105', 'NRTI', '41', '0', 'M', 'L', 'ZDV'),
('5', '105', 'NRTI', '67', '0', 'D', 'N', 'ABC'),
('5', '105', 'NRTI', '67', '0', 'D', 'N', 'DDI'),
('5', '105', 'NRTI', '67', '0', 'D', 'N', 'TDF'),
('5', '105', 'NRTI', '67', '0', 'D', 'N', 'D4T'),
('5', '105', 'NRTI', '67', '0', 'D', 'N', 'ZDV'),
('5', '105', 'NRTI', '70', '0', 'K', 'R', 'D4T'),
('5', '105', 'NRTI', '70', '0', 'K', 'R', 'ZDV'),
('5', '105', 'NRTI', '210', '0', 'L', 'W', 'ABC'),
('5', '105', 'NRTI', '210', '0', 'L', 'W', 'DDI'),
('5', '105', 'NRTI', '210', '0', 'L', 'W', 'TDF'),
('5', '105', 'NRTI', '210', '0', 'L', 'W', 'D4T'),
('5', '105', 'NRTI', '210', '0', 'L', 'W', 'ZDV'),
('5', '105', 'NRTI', '215', '0', 'T', 'F', 'ABC'),
('5', '105', 'NRTI', '215', '0', 'T', 'F', 'DDI'),
('5', '105', 'NRTI', '215', '0', 'T', 'F', 'TDF'),
('5', '105', 'NRTI', '215', '0', 'T', 'F', 'D4T'),
('5', '105', 'NRTI', '215', '0', 'T', 'F', 'ZDV'),
('5', '105', 'NRTI', '215', '0', 'T', 'Y', 'ABC'),
('5', '105', 'NRTI', '215', '0', 'T', 'Y', 'DDI'),
('5', '105', 'NRTI', '215', '0', 'T', 'Y', 'TDF'),
('5', '105', 'NRTI', '215', '0', 'T', 'Y', 'D4T'),
('5', '105', 'NRTI', '215', '0', 'T', 'Y', 'ZDV'),
('5', '105', 'NRTI', '219', '0', 'K', 'Q', 'D4T'),
('5', '105', 'NRTI', '219', '0', 'K', 'Q', 'ZDV'),
('5', '105', 'NRTI', '219', '0', 'K', 'E', 'D4T'),
('5', '105', 'NRTI', '219', '0', 'K', 'E', 'ZDV'),
('5', '105', 'NRTI', '65', '0', 'K', 'R', '3TC'),
('5', '105', 'NRTI', '65', '0', 'K', 'R', 'FTC'),
('5', '105', 'NRTI', '65', '0', 'K', 'R', 'ABC'),
('5', '105', 'NRTI', '65', '0', 'K', 'R', 'DDI'),
('5', '105', 'NRTI', '65', '0', 'K', 'R', 'TDF'),
('5', '105', 'NRTI', '65', '0', 'K', 'R', 'D4T'),
('5', '105', 'NRTI', '65', '0', 'K', 'N', '3TC'),
('5', '105', 'NRTI', '65', '0', 'K', 'N', 'FTC'),
('5', '105', 'NRTI', '65', '0', 'K', 'N', 'ABC'),
('5', '105', 'NRTI', '65', '0', 'K', 'N', 'DDI'),
('5', '105', 'NRTI', '65', '0', 'K', 'N', 'TDF'),
('5', '105', 'NRTI', '65', '0', 'K', 'N', 'D4T'),
('5', '105', 'NRTI', '70', '0', 'K', 'E', '3TC'),
('5', '105', 'NRTI', '70', '0', 'K', 'E', 'FTC'),
('5', '105', 'NRTI', '70', '0', 'K', 'E', 'ABC'),
('5', '105', 'NRTI', '70', '0', 'K', 'E', 'DDI'),
('5', '105', 'NRTI', '70', '0', 'K', 'E', 'TDF'),
('5', '105', 'NRTI', '70', '0', 'K', 'G', '3TC'),
('5', '105', 'NRTI', '70', '0', 'K', 'G', 'FTC'),
('5', '105', 'NRTI', '70', '0', 'K', 'G', 'ABC'),
('5', '105', 'NRTI', '70', '0', 'K', 'G', 'DDI'),
('5', '105', 'NRTI', '70', '0', 'K', 'G', 'TDF'),
('5', '105', 'NRTI', '74', '0', 'L', 'V', 'ABC'),
('5', '105', 'NRTI', '74', '0', 'L', 'V', 'DDI'),
('5', '105', 'NRTI', '74', '0', 'L', 'I', 'ABC'),
('5', '105', 'NRTI', '74', '0', 'L', 'I', 'DDI'),
('5', '105', 'NRTI', '75', '0', 'V', 'T', 'ABC'),
('5', '105', 'NRTI', '75', '0', 'V', 'T', 'DDI'),
('5', '105', 'NRTI', '75', '0', 'V', 'T', 'D4T'),
('5', '105', 'NRTI', '75', '0', 'V', 'M', 'ABC'),
('5', '105', 'NRTI', '75', '0', 'V', 'M', 'DDI'),
('5', '105', 'NRTI', '75', '0', 'V', 'M', 'TDF'),
('5', '105', 'NRTI', '75', '0', 'V', 'M', 'D4T'),
('5', '105', 'NRTI', '115', '0', 'Y', 'F', 'ABC'),
('5', '105', 'NRTI', '115', '0', 'Y', 'F', 'TDF'),
('5', '105', 'NRTI', '69', '1', '-', 'X', '3TC'),
('5', '105', 'NRTI', '69', '1', '-', 'X', 'FTC'),
('5', '105', 'NRTI', '69', '1', '-', 'X', 'ABC'),
('5', '105', 'NRTI', '69', '1', '-', 'X', 'DDI'),
('5', '105', 'NRTI', '69', '1', '-', 'X', 'TDF'),
('5', '105', 'NRTI', '69', '1', '-', 'X', 'D4T'),
('5', '105', 'NRTI', '69', '1', '-', 'X', 'ZDV'),
('5', '105', 'NRTI', '151', '0', 'Q', 'M', '3TC'),
('5', '105', 'NRTI', '151', '0', 'Q', 'M', 'FTC'),
('5', '105', 'NRTI', '151', '0', 'Q', 'M', 'ABC'),
('5', '105', 'NRTI', '151', '0', 'Q', 'M', 'DDI'),
('5', '105', 'NRTI', '151', '0', 'Q', 'M', 'TDF'),
('5', '105', 'NRTI', '151', '0', 'Q', 'M', 'D4T'),
('5', '105', 'NRTI', '151', '0', 'Q', 'M', 'ZDV'),
('5', '105', 'NRTI', '62', '0', 'A', 'V', '3TC'),
('5', '105', 'NRTI', '62', '0', 'A', 'V', 'FTC'),
('5', '105', 'NRTI', '62', '0', 'A', 'V', 'ABC'),
('5', '105', 'NRTI', '62', '0', 'A', 'V', 'DDI'),
('5', '105', 'NRTI', '62', '0', 'A', 'V', 'TDF'),
('5', '105', 'NRTI', '62', '0', 'A', 'V', 'D4T'),
('5', '105', 'NRTI', '62', '0', 'A', 'V', 'ZDV'),
('5', '105', 'NRTI', '75', '0', 'V', 'I', 'ABC'),
('5', '105', 'NRTI', '75', '0', 'V', 'I', 'DDI'),
('5', '105', 'NRTI', '75', '0', 'V', 'I', 'D4T'),
('5', '105', 'NRTI', '75', '0', 'V', 'I', 'ZDV'),
('5', '105', 'NRTI', '77', '0', 'F', 'L', 'ABC'),
('5', '105', 'NRTI', '77', '0', 'F', 'L', 'DDI'),
('5', '105', 'NRTI', '77', '0', 'F', 'L', 'D4T'),
('5', '105', 'NRTI', '77', '0', 'F', 'L', 'ZDV'),
('5', '105', 'NRTI', '116', '0', 'F', 'Y', 'ABC'),
('5', '105', 'NRTI', '116', '0', 'F', 'Y', 'DDI'),
('5', '105', 'NRTI', '116', '0', 'F', 'Y', 'D4T'),
('5', '105', 'NRTI', '116', '0', 'F', 'Y', 'ZDV'),
('5', '105', 'NNRTI', '98', '0', 'A', 'G', 'NVP'),
('5', '105', 'NNRTI', '98', '0', 'A', 'G', 'DLV'),
('5', '105', 'NNRTI', '98', '0', 'A', 'G', 'EFV'),
('5', '105', 'NNRTI', '98', '0', 'A', 'G', 'ETR'),
('5', '105', 'NNRTI', '100', '0', 'L', 'I', 'NVP'),
('5', '105', 'NNRTI', '100', '0', 'L', 'I', 'DLV'),
('5', '105', 'NNRTI', '100', '0', 'L', 'I', 'EFV'),
('5', '105', 'NNRTI', '100', '0', 'L', 'I', 'ETR'),
('5', '105', 'NNRTI', '101', '0', 'K', 'E', 'NVP'),
('5', '105', 'NNRTI', '101', '0', 'K', 'E', 'DLV'),
('5', '105', 'NNRTI', '101', '0', 'K', 'E', 'EFV'),
('5', '105', 'NNRTI', '101', '0', 'K', 'E', 'ETR'),
('5', '105', 'NNRTI', '101', '0', 'K', 'P', 'NVP'),
('5', '105', 'NNRTI', '101', '0', 'K', 'P', 'DLV'),
('5', '105', 'NNRTI', '101', '0', 'K', 'P', 'EFV'),
('5', '105', 'NNRTI', '101', '0', 'K', 'P', 'ETR'),
('5', '105', 'NNRTI', '103', '0', 'K', 'N', 'NVP'),
('5', '105', 'NNRTI', '103', '0', 'K', 'N', 'DLV'),
('5', '105', 'NNRTI', '103', '0', 'K', 'N', 'EFV'),
('5', '105', 'NNRTI', '103', '0', 'K', 'S', 'NVP'),
('5', '105', 'NNRTI', '103', '0', 'K', 'S', 'DLV'),
('5', '105', 'NNRTI', '103', '0', 'K', 'S', 'EFV'),
('5', '105', 'NNRTI', '106', '0', 'V', 'A', 'NVP'),
('5', '105', 'NNRTI', '106', '0', 'V', 'A', 'DLV'),
('5', '105', 'NNRTI', '106', '0', 'V', 'A', 'EFV'),
('5', '105', 'NNRTI', '106', '0', 'V', 'M', 'NVP'),
('5', '105', 'NNRTI', '106', '0', 'V', 'M', 'DLV'),
('5', '105', 'NNRTI', '106', '0', 'V', 'M', 'EFV'),
('5', '105', 'NNRTI', '108', '0', 'V', 'I', 'NVP'),
('5', '105', 'NNRTI', '108', '0', 'V', 'I', 'DLV'),
('5', '105', 'NNRTI', '108', '0', 'V', 'I', 'EFV'),
('5', '105', 'NNRTI', '179', '0', 'V', 'D', 'NVP'),
('5', '105', 'NNRTI', '179', '0', 'V', 'D', 'DLV'),
('5', '105', 'NNRTI', '179', '0', 'V', 'D', 'ETR'),
('5', '105', 'NNRTI', '179', '0', 'V', 'D', 'EFV'),
('5', '105', 'NNRTI', '179', '0', 'V', 'E', 'NVP'),
('5', '105', 'NNRTI', '179', '0', 'V', 'E', 'DLV'),
('5', '105', 'NNRTI', '179', '0', 'V', 'E', 'EFV'),
('5', '105', 'NNRTI', '179', '0', 'V', 'E', 'ETR'),
('5', '105', 'NNRTI', '179', '0', 'V', 'F', 'NVP'),
('5', '105', 'NNRTI', '179', '0', 'V', 'F', 'DLV'),
('5', '105', 'NNRTI', '179', '0', 'V', 'F', 'EFV'),
('5', '105', 'NNRTI', '179', '0', 'V', 'F', 'ETR'),
('5', '105', 'NNRTI', '181', '0', 'Y', 'C', 'NVP'),
('5', '105', 'NNRTI', '181', '0', 'Y', 'C', 'DLV'),
('5', '105', 'NNRTI', '181', '0', 'Y', 'C', 'EFV'),
('5', '105', 'NNRTI', '181', '0', 'Y', 'C', 'ETR'),
('5', '105', 'NNRTI', '181', '0', 'Y', 'I', 'NVP'),
('5', '105', 'NNRTI', '181', '0', 'Y', 'I', 'DLV'),
('5', '105', 'NNRTI', '181', '0', 'Y', 'I', 'EFV'),
('5', '105', 'NNRTI', '181', '0', 'Y', 'I', 'ETR'),
('5', '105', 'NNRTI', '181', '0', 'Y', 'V', 'NVP'),
('5', '105', 'NNRTI', '181', '0', 'Y', 'V', 'DLV'),
('5', '105', 'NNRTI', '181', '0', 'Y', 'V', 'EFV'),
('5', '105', 'NNRTI', '181', '0', 'Y', 'V', 'ETR'),
('5', '105', 'NNRTI', '188', '0', 'Y', 'L', 'NVP'),
('5', '105', 'NNRTI', '188', '0', 'Y', 'L', 'DLV'),
('5', '105', 'NNRTI', '188', '0', 'Y', 'L', 'EFV'),
('5', '105', 'NNRTI', '188', '0', 'Y', 'L', 'ETR'),
('5', '105', 'NNRTI', '188', '0', 'Y', 'H', 'NVP'),
('5', '105', 'NNRTI', '188', '0', 'Y', 'H', 'DLV'),
('5', '105', 'NNRTI', '188', '0', 'Y', 'H', 'EFV'),
('5', '105', 'NNRTI', '188', '0', 'Y', 'H', 'ETR'),
('5', '105', 'NNRTI', '188', '0', 'Y', 'C', 'NVP'),
('5', '105', 'NNRTI', '188', '0', 'Y', 'C', 'DLV'),
('5', '105', 'NNRTI', '188', '0', 'Y', 'C', 'EFV'),
('5', '105', 'NNRTI', '188', '0', 'Y', 'C', 'ETR'),
('5', '105', 'NNRTI', '190', '0', 'G', 'A', 'NVP'),
('5', '105', 'NNRTI', '190', '0', 'G', 'A', 'EFV'),
('5', '105', 'NNRTI', '190', '0', 'G', 'A', 'ETR'),
('5', '105', 'NNRTI', '190', '0', 'G', 'S', 'NVP'),
('5', '105', 'NNRTI', '190', '0', 'G', 'S', 'EFV'),
('5', '105', 'NNRTI', '190', '0', 'G', 'S', 'ETR'),
('5', '105', 'NNRTI', '190', '0', 'G', 'E', 'NVP'),
('5', '105', 'NNRTI', '190', '0', 'G', 'E', 'EFV'),
('5', '105', 'NNRTI', '190', '0', 'G', 'E', 'ETR'),
('5', '105', 'NNRTI', '190', '0', 'G', 'E', 'DLV'),
('5', '105', 'NNRTI', '225', '0', 'P', 'H', 'EFV'),
('5', '105', 'NNRTI', '227', '0', 'F', 'L', 'NVP'),
('5', '105', 'NNRTI', '227', '0', 'F', 'C', 'NVP'),
('5', '105', 'NNRTI', '227', '0', 'F', 'C', 'DLV'),
('5', '105', 'NNRTI', '227', '0', 'F', 'C', 'EFV'),
('5', '105', 'NNRTI', '227', '0', 'F', 'C', 'ETR'),
('5', '105', 'NNRTI', '230', '0', 'M', 'L', 'NVP'),
('5', '105', 'NNRTI', '230', '0', 'M', 'L', 'DLV'),
('5', '105', 'NNRTI', '230', '0', 'M', 'L', 'EFV'),
('5', '105', 'NNRTI', '230', '0', 'M', 'L', 'ETR'),
('5', '105', 'NNRTI', '236', '0', 'P', 'L', 'DLV'),
('5', '105', 'NNRTI', '238', '0', 'K', 'T', 'NVP'),
('5', '105', 'NNRTI', '238', '0', 'K', 'T', 'DLV'),
('5', '105', 'NNRTI', '238', '0', 'K', 'T', 'EFV'),
('5', '105', 'NNRTI', '238', '0', 'K', 'T', 'ETR')
;
-- ----------------------------
-- Table structure for sequenceanalysis.virus_strains
-- ----------------------------
CREATE TABLE sequenceanalysis.virus_strains
(
virus_strain VARCHAR(45) NOT NULL,
genbank VARCHAR(45) DEFAULT NULL,
species VARCHAR(45) NOT NULL,
workbook VARCHAR(45) DEFAULT NULL,
--Container ENTITYID NOT NULL,
CreatedBy USERID,
Created TIMESTAMP,
ModifiedBy USERID,
Modified TIMESTAMP,
CONSTRAINT PK_virus_strains PRIMARY KEY (virus_strain)
)
WITH (OIDS=FALSE);
-- ----------------------------
-- Records of sequenceAnalysis.virus_strains
-- ----------------------------
INSERT INTO sequenceanalysis.virus_strains
(virus_strain, genbank, species, workbook)
VALUES
('SIVmac239', 'M33262', 'SIV', NULL),
('SIVmac251', 'M19499', 'SIV', NULL),
('SHIV89.6P', 'U89134', 'SIV', NULL),
('E660', NULL, 'SIV', NULL),
('HXB2', 'NC_001802', 'HIV', NULL),
('SIVmac251_CMstock', NULL, 'SIV', NULL),
('A_Kawasaki_173_2001', NULL, 'Influenza A', NULL),
('A_California_04_09', NULL, 'Influenza A', NULL),
('A_Kawasaki_UTK-04_09', NULL, 'Influenza A', NULL),