# mohsennezhad / ThyroidProject
import concurrent.futures
import time
from urllib.error import HTTPError
from urllib.request import urlretrieve

from torch.utils.data import IterableDataset
from tqdm import tqdm

from config import Config


def find_in_log_n(start, end, func, bias=0.3):
    """Narrow the integer interval ``[start, end)`` using a biased bisection.

    The interval is repeatedly split at a probe point placed ``bias`` of the
    way from ``start`` to ``end``.  When ``func(probe)`` is truthy the lower
    bound moves up to the probe, otherwise the upper bound moves down to it.
    The search stops once the bounds are at most one apart.

    The result is only meaningful when ``func`` is truthy up to some
    threshold and falsy afterwards; in that case the returned value is the
    largest probed value for which ``func`` was truthy (or ``start`` itself
    if no probe was truthy -- note that ``func(start)`` is never evaluated).

    Args:
        start: Inclusive lower bound of the search interval.
        end: Exclusive upper bound of the search interval.
        func: Predicate called with a single integer probe.
        bias: Relative position of the probe inside the current interval
            (0.5 gives a classic bisection).  It is applied on every step.

    Returns:
        The final lower bound of the narrowed interval.
    """
    # Iterative form: avoids recursion depth limits and keeps ``bias`` in
    # effect for every step instead of only the first one.
    while end - start > 1:
        mid = int(start * (1 - bias) + end * bias)
        # Keep the probe strictly inside (start, end) so each step shrinks
        # the interval, whatever the bias or the sign of the bounds.
        mid = min(max(mid, start + 1), end - 1)
        if func(mid):
            start = mid
        else:
            end = mid
    return start


def fetch_tile_content(tile_url, retry=15):
    """Download ``tile_url`` and return its raw bytes, retrying on failure.

    Each failed attempt prints a short marker and sleeps for
    ``2 ** (0.3 * attempt_number)`` seconds before the next try.  After the
    last failed attempt the user is prompted on stdin; answering ``y``
    restarts the whole retry cycle, anything else re-raises the last error.

    Args:
        tile_url: URL of the resource to download.
        retry: Maximum number of attempts per retry cycle.

    Returns:
        The response body as ``bytes``.

    Raises:
        Exception: The error of the final attempt, when the user declines
            to continue.
        HTTPError: With code 500 when no attempt is made at all
            (``retry`` is zero or negative).
    """
    # Imported locally so the block does not depend on the file-level import
    # list; the body is read straight into memory instead of going through a
    # temporary file that ``urlretrieve`` would leave behind on disk.
    from urllib.request import urlopen

    for attempt in range(retry):
        try:
            with urlopen(tile_url) as response:
                return response.read()
        except Exception:
            # Broad on purpose: any failure (network, HTTP, truncated read)
            # is treated as retryable.
            print("e", end="|")
            time.sleep(2 ** (0.3 * (attempt + 1)))
            if attempt == retry - 1:
                if input("continue") == "y":
                    return fetch_tile_content(tile_url, retry)
                raise
    # Only reachable when the loop body never ran.
    raise HTTPError(url=tile_url, code=500, msg="Not able to fetch image tile", hdrs={}, fp=None)


def download_urls_in_thread(url_and_index_list):
    """Download many tiles concurrently and yield ``(content, index)`` pairs.

    This is a generator: nothing is downloaded until it is first iterated.
    Downloads run on a thread pool sized by ``Config.workers`` and results
    are yielded in the same order as the input, wrapped in a ``tqdm``
    progress bar.

    Args:
        url_and_index_list: Sized collection of ``(url, index)`` pairs.

    Yields:
        ``(file_content, index)`` for every input pair.
    """
    def _fetch_pair(url_index_pair):
        # Carry the caller's index along with the downloaded bytes.
        tile_url, tile_index = url_index_pair
        return fetch_tile_content(tile_url), tile_index

    with concurrent.futures.ThreadPoolExecutor(max_workers=Config.workers) as pool:
        results = pool.map(_fetch_pair, url_and_index_list)
        progress = tqdm(results, total=len(url_and_index_list))
        yield from progress


def _get_alignment_sore_and_percent(seq1, seq2, match_score=2, mismatch_score=-1, gap_score=-1):
    """Return the global alignment score of ``seq1`` against ``seq2``.

    Both inputs are wrapped and encoded with a shared vocabulary from the
    ``alignment`` package, then aligned with ``GlobalSequenceAligner`` using
    a ``SimpleScoring`` scheme.  No backtrace is requested, so only the
    value returned by ``align`` is handed back.

    Args:
        seq1: First sequence.
        seq2: Second sequence.
        match_score: Score passed to ``SimpleScoring`` for matches.
        mismatch_score: Score passed to ``SimpleScoring`` for mismatches.
        gap_score: Gap score passed to ``GlobalSequenceAligner``.

    Returns:
        Whatever ``aligner.align(..., backtrace=False)`` returns
        (presumably a numeric score; the caller divides it by a length).
    """
    # Imported lazily, so the third-party package is only needed when an
    # alignment is actually computed.
    from alignment.sequence import Sequence
    from alignment.sequencealigner import GlobalSequenceAligner, SimpleScoring
    from alignment.vocabulary import Vocabulary

    vocabulary = Vocabulary()
    encoded_first = vocabulary.encodeSequence(Sequence(seq1))
    encoded_second = vocabulary.encodeSequence(Sequence(seq2))

    aligner = GlobalSequenceAligner(SimpleScoring(match_score, mismatch_score), gap_score)
    return aligner.align(encoded_first, encoded_second, backtrace=False)


def get_normalized_score(seq1, seq2):
    """Return the alignment score divided by the combined sequence length.

    The score comes from ``_get_alignment_sore_and_percent`` with its
    default scoring parameters.

    Raises:
        ZeroDivisionError: When both sequences are empty.
    """
    raw_score = _get_alignment_sore_and_percent(seq1, seq2)
    combined_length = len(seq2) + len(seq1)
    return raw_score / combined_length


class DatasetWithGenerator(IterableDataset):
    """Expose an existing generator (or any iterable) as an ``IterableDataset``.

    The wrapped object is stored as-is.  A one-shot generator is exhausted
    after a single pass, so iterating the dataset a second time yields
    nothing in that case; a re-iterable object such as a list can be
    traversed repeatedly.
    """

    def __init__(self, generator):
        """Store ``generator``, the source of the dataset's items."""
        super().__init__()
        self.generator = generator

    def __iter__(self):
        """Return an iterator over the wrapped source.

        ``iter()`` hands a generator back unchanged, and additionally makes
        plain iterables (lists, tuples, ...) valid sources instead of
        failing with ``TypeError`` for returning a non-iterator.
        """
        return iter(self.generator)


if __name__ == '__main__':
    # Ad-hoc smoke check, run only when the module is executed directly:
    # print log2 of one million, then the boundary that find_in_log_n
    # locates for the predicate ``x <= 76`` on the interval [0, 100).
    import math

    million = 10 ** 6
    print(math.log2(million))

    boundary = find_in_log_n(0, 100, lambda value: value <= 76)
    print(boundary)