Skip to content

Instantly share code, notes, and snippets.

@hussius
hussius / decode_cossmo_example.py
Created April 26, 2018 11:02 — forked from hannes-brt/decode_cossmo_example.py
Function to decode a COSSMO training example in tfrecord format
def read_single_cossmo_example(serialized_example, n_tissues=1, coord_sys='rna1'):
"""Decode a single COSSMO example
coord_sys must be one of 'rna1' or 'dna0'. If it is 'dna0', an extra 'strand' field
must exist in the tfrecord and is extracted.
"""
assert coord_sys in ['dna0', 'rna1']
context_features = {
@hussius
hussius / preprocess_yeast_dna.py
Created June 14, 2018 12:17
Preprocess yeast DNA csv file from Genome Research paper
from pathlib import Path
import os
import sys
from fire import Fire
import numpy as np
import pandas as pd
from tqdm import tqdm
"""
* Converts images to GGB (grayscale)
* Creates subsets for training and validation
* Adds columns to indicate training or validation (useful for analysis of the deployed model)
* Adds rotated images to the dataset
* Creates comma-separated CSV file
* Creates zip archive
"""
import pandas as pd