#!/usr/bin/env python3

import argparse
import sys
import json
import os
import re
import time
import datetime
from pprint import pprint

# termcolor is an optional dependency: when the import fails the script
# still works and print_colored() falls back to plain print().
try:
    from termcolor import cprint
    colors_supported = True
except ImportError:
    colors_supported = False

# Absolute directory of this script (symlinks resolved); data.json is read
# from it and data.md is written to it.
CWD = os.path.dirname(os.path.realpath(__file__))

def print_colored(s, color, fallback_prefix=''):
    """Print *s* in *color*, or with a plain-text prefix when colors are off.

    Args:
        s: Text to print.
        color: Color name handed to termcolor's ``cprint``.
        fallback_prefix: Text prepended to *s* when termcolor is unavailable,
            so the line can still be told apart without color.
    """
    if not colors_supported:
        print(fallback_prefix + s)
        return

    cprint(s, color)

def load_data():
    """Load the cipher entries from ``data.json`` next to this script.

    The file is read explicitly as UTF-8: it holds Cyrillic text, and relying
    on the locale's default encoding breaks on systems where that default is
    not UTF-8.

    Returns:
        A list of the entries whose ``'text'`` value is not the empty string
        (empty texts are placeholders and are dropped).

    Raises:
        OSError: If ``data.json`` cannot be opened.
        json.JSONDecodeError: If the file is not valid JSON.
        KeyError: If an entry has no ``'text'`` key.
    """
    with open(os.path.join(CWD, "data.json"), encoding="utf-8") as f:
        data = json.load(f)

    # ignore placeholders
    return [item for item in data if item['text'] != '']

def clean_string(s, remove_junk=False):
    """Normalise cipher text: fix spacing, upper-case, optionally drop junk.

    Steps, in order:
      1. Put a space after every ``)`` and after every ``!`` / ``.`` that is
         followed by a character other than ``)``.
      2. Upper-case the text and collapse whitespace runs to single spaces.
      3. When *remove_junk* is true, drop junk words (whole-token match),
         delete junk phrases (plain substring match, in list order) and join
         the spelled-out word ``Х О Р Т И Ц А`` with underscores.
      4. Collapse whitespace again and strip the ends.

    Args:
        s: Raw text.
        remove_junk: Whether to apply step 3.

    Returns:
        The cleaned, upper-cased string.
    """
    # Disabled step: s = s.replace('/', ' ')
    text = s.replace(')', ') ')
    text = re.sub(r'(\!|\.)([^\)])', r'\1 \2', text)
    text = re.sub(r'\s+', ' ', text.upper()).strip()

    # Filler words and phrases that carry no cipher letter.  Order matters
    # for the multi-word phrases because they are removed one after another.
    # Disabled entries: 'ПРИСУТСТВИЕ', 'ЛИНЕЙНО', 'КАЗНЬ', 'СТАЛЬНЫЕ',
    # 'ТРАНСПОРТИРОВКА', 'РЕАГИРОВАНИЕ', 'BIOROBOT', 'LEGAL', 'FIGHTING'.
    junks = [
        'ВОЕННОЕ', 'ВЫШЕСТОЯЩИХ', 'ПРАВО', 'ПРАВИЛАМ ВОЙНЫ', 'ВЫПИСКА',
        'КОНТРОЛЬ', 'ИХ', 'ПО', 'НАВЫКИ', 'С ВЫШЕСТОЯЩИМИ',
        'ЗАКОННО!', 'ПОХЛЕБКА', 'СВЯЗЕЙ', 'ЖУЮЩЕГО ХРЯЩИ',
        'ИНДЕКСИРОВАН БЕЗУКОРИЗНЕННО', 'ОТКЛАДЫВАЕТСЯ ЛИНЕЙНО',
        '- ЕГО ВЕЛИЧЕСТВО', 'ГУБЕРНИЯ', 'С ВЫШЕСТОЯЩИМИ КОНТРОЛЬ',
        'С ЛОКАЦИИ', 'ГУБЕРНИЯ', 'ПРОВЕРКИ', 'УСТАНОВЛЕНО', 'ПОБЕДИТЕЛЕМ',
        'НЕРВЫ', 'ДАРОВАНО', 'ОДОБРЕНО', 'ПРОЯВЛЕНИЯ', 'УЗАКОНЕНО',
        'ИМЕЕТСЯ', 'ЗНАЛ', 'НЕ ПРИМЕЧЕНО', 'НА СЕВЕР', 'ПРИГОВОРИТЬ',
        'ШЕСТВУЕМ', 'ДАГОН', 'ДА МЕРЗНУЩИЙ', 'КОФЕ', 'УКАЗАНО',
        '- ВЫСОКИЙ ТИТУЛ', 'ЗАКАЗ', 'ЧЕРТЫ ЛИЦА',

        # english
        'SCHOOL ON THE RIGHT', 'WILL NOT ALLOW', 'FLYWHEEL', 'TRIUMPHANTLY',
        'BEING USED', 'NICE', 'UMBRELLA', 'CONSERVATISM', 'WAS ESTABLISHED',
        'WITH A PASSWORD', 'ANT', 'YEAR', 'RECOGNIZED', 'SEARCHED',
    ]

    # entries without spaces: compared against whole tokens
    junk_words = frozenset(entry for entry in junks if ' ' not in entry)

    # entries with spaces: removed as substrings, in list order
    junk_phrases = [entry for entry in junks if ' ' in entry]

    if remove_junk:
        # NOTE: the pattern reads as  (\.)  |  (\!$)  -- dots are removed
        # anywhere in the token, '!' only at its end -- before the lookup.
        surviving = [
            token
            for token in text.split(' ')
            if re.sub(r'\.|\!$', '', token) not in junk_words
        ]
        text = ' '.join(surviving)

        for phrase in junk_phrases:
            text = text.replace(phrase, '')

        # The spelled-out word stands for the single letter Х; gluing it into
        # one token keeps it from being split into seven separate words.
        text = text.replace('Х О Р Т И Ц А', 'Х_О_Р_Т_И_Ц_А')

    return re.sub(r'\s+', ' ', text).strip()

def decode(s, is_url=False):
    """Decode a type-1 cipher: take the first character of every word.

    Words are separated by single spaces.  Two kinds of word are treated
    specially:
      * a word starting with a digit is copied to the output in full;
      * with *is_url* set, a word ending in ``://`` contributes its first
        character followed by ``://``.

    Args:
        s: Space-separated text.
        is_url: Enable the ``://`` handling described above.

    Returns:
        The concatenated result.
    """
    pieces = []
    for token in s.split(' '):
        token = token.strip()
        if not token:
            continue

        if re.match(r'^\d+', token):
            # numbers are kept verbatim
            pieces.append(token)
        elif is_url and token.endswith('://'):
            pieces.append(token[0] + '://')
        else:
            pieces.append(token[0])

    return ''.join(pieces)

def decode2(s):
    """Decode a type-2 cipher: first letter of the second word per sentence.

    The text is split into sentences on runs of ``?``, ``.`` and ``!``.  Each
    sentence is split on any whitespace, so repeated spaces or line breaks
    between words do not shift the word positions.  Sentences with fewer
    than two words carry no letter and are skipped instead of raising
    ``IndexError``.

    Args:
        s: Cipher text.

    Returns:
        The decoded string (empty when no sentence has a second word).
    """
    letters = []
    for sentence in re.split(r'[\?\.\!]+', s):
        words = sentence.split()
        if len(words) < 2:
            continue
        letters.append(words[1][0])

    return ''.join(letters)

def decode3(s):
    """Decode a type-3 cipher: one letter per sentence, chosen by position.

    The text is split into sentences on runs of ``?``, ``.`` and ``!``.
    Spaces and hyphens are removed from each sentence and it is upper-cased;
    empty sentences are ignored.  The letter is then chosen by the first rule
    that matches:

      1. the sentence starts with ``Ш``, ``Щ`` or ``И`` -> that letter;
      2. otherwise the first ``(index, letter)`` pair in the rule table
         whose letter sits at that index;
      3. otherwise ``?``.

    A leftover debug ``print``/``continue`` used to short-circuit the loop,
    so the function always returned an empty string; it has been removed.
    Index lookups are bounds-safe, so a sentence shorter than a rule's index
    simply does not match that rule.

    Args:
        s: Cipher text.

    Returns:
        The decoded string, with ``?`` for sentences no rule matched.
    """
    # Checked in this order; the first hit wins.
    positional_rules = (
        (4, 'Й'),
        (7, 'М'),
        (4, 'А'),
        (2, 'Р'),
        (1, 'У'),
        (9, 'Ю'),
    )

    letters = []
    for sentence in re.split(r'[\?\.\!]+', s):
        compact = sentence.strip().replace(' ', '').replace('-', '')
        if not compact:
            continue

        compact = compact.upper()

        if compact[0] in ('Ш', 'Щ', 'И'):
            letters.append(compact[0])
            continue

        for index, letter in positional_rules:
            # Slicing yields '' past the end instead of raising IndexError.
            if compact[index:index + 1] == letter:
                letters.append(letter)
                break
        else:
            letters.append('?')

    return ''.join(letters)


def decode_auto(s, t, reverse_decoded=False, remove_junk=True, is_url=False):
    """Decode *s* with the decoder selected by cipher type *t*.

    Args:
        s: Source text.
        t: Cipher type. ``1`` cleans the text with ``clean_string`` and then
            applies ``decode``; ``2`` applies ``decode2``; ``3`` applies
            ``decode3``.
        reverse_decoded: Reverse the decoded string before returning it.
        remove_junk: Passed to ``clean_string`` (type 1 only).
        is_url: Passed to ``decode`` (type 1 only).

    Returns:
        The decoded (and optionally reversed) string.

    Raises:
        ValueError: If *t* is not one of the supported cipher types.
    """
    if t == 1:
        cleaned = clean_string(s, remove_junk=remove_junk)
        result = decode(cleaned, is_url=is_url)
    elif t == 2:
        result = decode2(s)
    elif t == 3:
        result = decode3(s)
    else:
        # Without this branch ``result`` would be unbound below.
        raise ValueError('unknown cipher type: %r' % (t,))

    if reverse_decoded:
        result = result[::-1]

    return result


def sort_data_by_date(item):
    """Sort key: the entry's ``'date'`` (``DD/MM/YY``) as integer seconds.

    Args:
        item: Mapping with a ``'date'`` string in ``%d/%m/%y`` format.

    Returns:
        The date converted through ``time.mktime`` (local time) and
        truncated to ``int``.
    """
    parsed = datetime.datetime.strptime(item['date'], '%d/%m/%y')
    seconds = time.mktime(parsed.timetuple())
    return int(seconds)

        
def _as_list(value):
    """Return *value* unchanged if it is a list, else wrap it in one."""
    return value if isinstance(value, list) else [value]


def _render_post(post):
    """Render one data entry as a Markdown fragment for the generated page."""
    cipher_type = post['type'] if 'type' in post else 1
    decoded_text = decode_auto(post['text'], cipher_type)

    parts = ['**Дата**: %s\n' % post['date']]

    if 'pic' in post and post['pic']:
        images = ''.join('![](./img/%s =300x)' % name
                         for name in _as_list(post['pic']))
        parts.append('**Пикрилейтед:** %s\n' % images)

    if 'link' in post:
        links = ', '.join('[%s](%s)' % (url, url)
                          for url in _as_list(post['link']))
        parts.append('**Ссылки:** %s\n' % links)

    if 'source' in post:
        parts.append('**Источник:** %s' % post['source'])
        if 'source_link' in post:
            parts.append(', [%s](%s)\n' % (post['source_link'], post['source_link']))
        else:
            parts.append('\n')

    parts.append('**Шифровка (тип %d)**: \n```\n%s\n```\n' % (cipher_type, post['text']))
    parts.append('**Расшифровка:** \n```\n%s\n```' % decoded_text)

    return ''.join(parts)


def main():
    """Command-line entry point.

    Exactly one mode runs, chosen in this order:
      * ``--decode``: decode the entries from data.json and print them;
      * ``--decode-string`` / ``--decode-file``: decode ad-hoc input;
      * ``--stats``: print the number of entries;
      * ``--gen-page``: write ``data.md`` next to the script.
    When no mode is selected the usage help is printed.

    data.json is loaded only by the modes that need it, so decoding an
    ad-hoc string or file works without the data file being present.
    """
    parser = argparse.ArgumentParser()
    parser.add_argument('--decode', action='store_true')
    parser.add_argument('--stats', action='store_true')
    parser.add_argument('--decode-string')
    parser.add_argument('--decode-file')
    parser.add_argument('--with-junk', action='store_true')
    # NOTE(review): --is-url is parsed but never forwarded to a decoder from
    # here, so it currently has no effect.
    parser.add_argument('--is-url', action='store_true')
    parser.add_argument('--type', type=int, choices=[1, 2, 3], default=1)
    parser.add_argument('--reverse-decoded', action='store_true')
    parser.add_argument('--gen-page', action='store_true')

    args = parser.parse_args()
    remove_junk = not args.with_junk

    if args.decode:
        data = load_data()

        # filter by type
        # NOTE(review): any --type other than 2 (including 3) selects the
        # entries WITHOUT a 'type' key; entries tagged with an explicit
        # type 1 or 3 are never shown. Confirm this is intended.
        if args.type == 2:
            data = [i for i in data if 'type' in i and i['type'] == 2]
        else:
            data = [i for i in data if 'type' not in i]

        # sort by text length
        data = sorted(data, key=lambda i: len(i['text']))

        for obj in data:
            text = obj['text']
            text_decoded = decode_auto(text,
                                       args.type,
                                       remove_junk=remove_junk,
                                       reverse_decoded=args.reverse_decoded)

            # Only type 1 goes through clean_string(); for the other types
            # the text is decoded as-is, so that is what gets shown.
            if args.type == 1:
                text_cleaned = clean_string(text, remove_junk=remove_junk)
            else:
                text_cleaned = text

            # print all information
            print(text)
            print_colored(text_cleaned, 'green', fallback_prefix='[CLEANED] ')
            print_colored(text_decoded, 'cyan', fallback_prefix='[DECODED] ')

            if 'pic' in obj:
                print_colored(', '.join(_as_list(obj['pic'])), 'red',
                              fallback_prefix='[PICS] ')
            if 'link' in obj:
                # 'link' may be a single URL or a list of URLs.
                print_colored(', '.join(_as_list(obj['link'])), 'red',
                              fallback_prefix='[LINK] ')

            print("\n")

    elif args.decode_string or args.decode_file:
        if args.decode_string:
            source = args.decode_string
        else:
            with open(args.decode_file, 'r') as f:
                source = f.read()

        text_decoded = decode_auto(source,
                                   args.type,
                                   remove_junk=remove_junk,
                                   reverse_decoded=args.reverse_decoded)

        # print
        print_colored(text_decoded, 'cyan', fallback_prefix='[DECODED] ')

    elif args.stats:
        count = len(load_data())
        print("Total texts: %s" % count)

    elif args.gen_page:
        # sort by date
        data = sorted(load_data(), key=sort_data_by_date)

        md = "\n---\n".join(_render_post(post) for post in data)

        # The page contains Cyrillic text; write it as UTF-8 regardless of
        # the locale's default encoding.
        with open(os.path.join(CWD, 'data.md'), 'w', encoding='utf-8') as f:
            f.write(md)

    else:
        parser.print_help()

# Run the CLI only when this file is executed as a script (not on import);
# whatever main() returns is handed to sys.exit() as the exit status.
if __name__ == '__main__':
    sys.exit(main())