Commit 3223df45 authored by Marine Bergot

Upload New File

parent a4069159
#! /usr/bin/env python3
# -*- coding: utf-8 -*-
import sys
# Substrings that disqualify a candidate token from being recorded as a name.
# NOTE(review): these look like annotation source / biotype values rather than
# gene names -- confirm against the input format actually used.
_EXCLUDED_MARKERS = ("havana", "ensembl", "protein_coding")


def _gene_name_from_line(line):
    """Return the candidate name carried by one input line, or ``None``.

    The line is stripped and split on ``;``.  The sixth field (index 5) is
    split on whitespace and its second token is the candidate name.  The
    token is returned verbatim (any surrounding quotes are kept).

    ``None`` is returned when:

    * the line has fewer than six ``;``-separated fields,
    * the sixth field has fewer than two whitespace-separated tokens
      (for example a line ending in ``;`` whose sixth field is empty), or
    * the token contains one of ``_EXCLUDED_MARKERS``.
    """
    fields = line.strip().split(";")
    if len(fields) < 6:
        return None

    tokens = fields[5].split()
    if len(tokens) < 2:
        # Malformed / empty sixth field: skip the line instead of crashing
        # with IndexError in the middle of the file.
        return None

    name = tokens[1]
    if any(marker in name for marker in _EXCLUDED_MARKERS):
        return None
    return name


def collect_gene_names(lines):
    """Return the set of distinct names found in an iterable of text lines.

    ``lines`` may be an open text file or any iterable of strings; lines that
    do not yield a name (see ``_gene_name_from_line``) are ignored.
    """
    names = set()
    for line in lines:
        name = _gene_name_from_line(line)
        if name is not None:
            names.add(name)
    return names


def main(argv):
    """Read names from ``argv[1]`` and write them, one per line, to ``argv[2]``.

    ``argv`` follows the ``sys.argv`` layout (program name first); arguments
    after the second path are ignored.  The input is read completely before
    the output file is opened.  Names are written in sorted order so the
    output is reproducible from run to run.

    Returns the process exit status: 0 on success, 2 when a path is missing.
    """
    if len(argv) < 3:
        program = argv[0] if argv else "script"
        sys.stderr.write(
            "usage: {} <input_file> <output_file>\n".format(program)
        )
        return 2

    with open(argv[1]) as bed_file:
        genes_list = collect_gene_names(bed_file)

    with open(argv[2], "w") as out_file:
        out_file.writelines(name + "\n" for name in sorted(genes_list))
    return 0


if __name__ == "__main__":
    sys.exit(main(sys.argv))
Markdown is supported
0% or
You are about to add 0 people to the discussion. Proceed with caution.
Finish editing this message first!
Please register or sign in to comment