當前位置: 首頁>>代碼示例>>Python>>正文


Python SequenceCollection.read方法代碼示例

本文整理匯總了Python中skbio.SequenceCollection.read方法的典型用法代碼示例。如果您正苦於以下問題:Python SequenceCollection.read方法的具體用法?Python SequenceCollection.read怎麽用?Python SequenceCollection.read使用的例子?那麽, 這裏精選的方法代碼示例或許可以為您提供幫助。您也可以進一步了解該方法所在skbio.SequenceCollection的用法示例。


在下文中一共展示了SequenceCollection.read方法的6個代碼示例,這些例子默認根據受歡迎程度排序。您可以為喜歡或者感覺有用的代碼點讚,您的評價將有助於係統推薦出更棒的Python代碼示例。

示例1: extract_seq_ids

# 需要導入模塊: from skbio import SequenceCollection [as 別名]
# 或者: from skbio.SequenceCollection import read [as 別名]
def extract_seq_ids(data, fmt='fasta', variant=None):
    """
    Given FASTQ-format data (string), parse out only the
    sequence IDs and return.
    """
    fh = StringIO(data)
    if fmt == 'fastq':
        sc = SequenceCollection.read(fh, format=fmt, variant=variant)
    else:
        sc = SequenceCollection.read(fh, format=fmt)
    return frozenset(entry.id for entry in sc)
開發者ID:3009420,項目名稱:PyMGRAST,代碼行數:13,代碼來源:filter_failed_screening.py

示例2: convert_phylip

# 需要導入模塊: from skbio import SequenceCollection [as 別名]
# 或者: from skbio.SequenceCollection import read [as 別名]
def convert_phylip(infile, outfile, format):
    seqs = SequenceCollection.read(
        infile, format='phylip',
        data_parser=phylip.relaxed_ids
    )

    seqs.write(outfile, format=format)
開發者ID:sh4wn,項目名稱:af-phylogeny,代碼行數:9,代碼來源:phylip-splitter.py

示例3: main

# 需要導入模塊: from skbio import SequenceCollection [as 別名]
# 或者: from skbio.SequenceCollection import read [as 別名]
def main():
    args = handle_program_options()

    if osp.isfile(args.out_dir):
        print("--out_dir (-o) option must be a valid directory and not a file",
              file=sys.stderr)
        sys.exit(1)

    # will fail gracefully if dir exists
    skbu.create_dir(args.out_dir)

    metagenomes = []
    if args.metagenome_id is not None:
        metagenomes.append(args.metagenome_id)
    elif args.metagenome_file is not None:
        metagenomes.extend(parse_metagenome_file(args.metagenome_file))
        
    if args.verbose:
        msg = 'Processing requested for {} metagenome(s) found in: {}'
        print(msg.format(len(metagenomes), args.metagenome_file))

    # MG-RAST stage.file ids for downloading
    derep_passed = '150.1'
    screen_passed = '299.1'

    for mg_id in metagenomes:
        if args.verbose:
            print('Processing metagenome: {}'.format(mg_id))
            print('\tDownloading: Dereplication Passed...', end='')
            sys.stdout.flush()
        derepp_rsp = mgapi.mgrast_request('download', mg_id,
                                          {'file': derep_passed},
                                          auth_key=args.auth_key)
        derepp_sc = SequenceCollection.read(StringIO(derepp_rsp.text),
                                            format='fastq',
                                            variant='illumina1.8')
        if args.verbose:
            print('{} sequences'.format(len(derepp_sc)))
            print('\tDownloading: Screen Passed...', end='')
            sys.stdout.flush()
        screenp_rsp = mgapi.mgrast_request('download', mg_id,
                                           {'file': screen_passed},
                                           auth_key=args.auth_key)
        screenp_ids = extract_seq_ids(screenp_rsp.text, fmt='fastq',
                                      variant='illumina1.8')
        if args.verbose:
            print('{} sequences'.format(len(screenp_ids)))

        # filter dereplication passed with IDs from screen passed
        failed_screen = filter_seqs(derepp_sc, screenp_ids)
        if args.verbose:
            nsp = len(screenp_ids)
            print('\tRemoved {} sequences from Dereplication Passed'.format(nsp))
            print('\tleaving {} sequences'.format(len(failed_screen)))

        out_fp = osp.join(args.out_dir, mg_id + '_screen_failed.fastq')
        failed_screen.write(out_fp, format='fastq', variant='illumina1.8')
        if args.verbose:
            print('Sequence data written to: ' + out_fp)
開發者ID:3009420,項目名稱:PyMGRAST,代碼行數:61,代碼來源:filter_failed_screening.py

示例4: test_make_mini_otu_files

# 需要導入模塊: from skbio import SequenceCollection [as 別名]
# 或者: from skbio.SequenceCollection import read [as 別名]
 def test_make_mini_otu_files(self):
     os.system("mkdir tmp")
     self.extension_seqs = SequenceCollection.read(self.extension_seqs)
     result = _make_mini_otu_files(self.key_node,
                                   self.extension_genus_dic_few,
                                   self.extension_seqs)
     os.system("rm -r tmp")
     self.assertEqual(result, """>P1\nTTAAAAAA\n""")
開發者ID:wasade,項目名稱:ghost-tree,代碼行數:10,代碼來源:test_hybridtree.py

示例5: str

# 需要導入模塊: from skbio import SequenceCollection [as 別名]
# 或者: from skbio.SequenceCollection import read [as 別名]
from qiime_default_reference import get_template_alignment, get_reference_sequences

from skbio import SequenceCollection

gapped_sequences = [(s.id, str(s)) for s in SequenceCollection.read(get_template_alignment())][:500]

sequences = [(s.id, str(s)) for s in SequenceCollection.read(get_reference_sequences())][:500]

motif_1 = "GGTGCAAGCCGGTGGAAACA"
開發者ID:bctaylor,項目名稱:sequence-benchmarks,代碼行數:11,代碼來源:test_data.py

示例6: get_argument_parser

# 需要導入模塊: from skbio import SequenceCollection [as 別名]
# 或者: from skbio.SequenceCollection import read [as 別名]
    log_choices = ["DEBUG", "INFO", "WARNING", "ERROR", "CRITICAL"]
    parser.add_argument(
        '--log-level', '-l', default="INFO", choices=log_choices,
        help="Set logging level. Default is info."
    )

    return parser

if __name__ == '__main__':
    parser = get_argument_parser()
    args = parser.parse_args()

    level = getattr(logging, args.log_level.upper(), logging.INFO)
    logging.basicConfig(level=level)

    sequences = SequenceCollection.read(args.infile, format=args.format)

    if args.parallel == 0 and len(sequences) > 16:
        pool_size = multiprocessing.cpu_count()
    else:
        pool_size = 1

    dmatrix = create_distance_matrix(sequences, d2.distance, pool_size,
                                     statistic=d2.d2_neighbourhood_dna)

    print(dmatrix)
    phylo_tree = nj(dmatrix)
    print(phylo_tree.ascii_art())
    phylo_tree.write(args.outfile, format=args.target)
開發者ID:sh4wn,項目名稱:af-phylogeny,代碼行數:31,代碼來源:af-phylogeny.py


注:本文中的skbio.SequenceCollection.read方法示例由純淨天空整理自Github/MSDocs等開源代碼及文檔管理平台,相關代碼片段篩選自各路編程大神貢獻的開源項目,源碼版權歸原作者所有,傳播和使用請參考對應項目的License;未經允許,請勿轉載。