# functions.py

from flask import Flask, render_template, session, request, redirect, flash, url_for, Blueprint, g

import urllib.parse
import random
import json
import re
import jinja2
import html
import config
import os.path
import os
from markdown import markdown
from bleach import clean

from datetime import datetime, timedelta
from math import log
import time

# Characters accepted by verify_username() and verify_subname(); rstring()
# also draws its random characters from this string.
# NOTE(review): '0' is listed twice (the digits run '0123456789' and then '0'
# again), so random.choice() in rstring() returns '0' twice as often as any
# other character -- confirm whether that is intended.
legal_chars = '01234567890abcdefghijklmnopqrstuvwxyzABCDEFGHIJKLMNOPQRSTUVWXYZ-_'

def thumb_exists(tid):
	"""Report whether a usable thumbnail file exists for *tid*.

	Looks for ``static/thumbnails/thumb-<tid>.PNG`` (relative to the current
	working directory) and requires the file to be larger than 10 bytes.

	Returns:
		True when the file exists and its size exceeds 10 bytes, else False.
	"""
	thumb_path = 'static/thumbnails/thumb-%s.PNG' % str(tid)
	return os.path.exists(thumb_path) and int(os.stat(thumb_path).st_size) > 10

def rstring(length1, length2=False):
	"""Return a random string built from ``legal_chars``.

	Args:
		length1: minimum length (and exact length when *length2* is omitted).
		length2: maximum length; when it compares equal to ``False`` (the
			default, but also ``0``) it falls back to *length1*.

	Returns:
		A string whose length is drawn uniformly from ``[length1, length2]``.
	"""
	# Equality (not identity) is used on purpose so that 0 behaves like the default.
	upper_bound = length1 if length2 == False else length2
	size = random.randint(length1, upper_bound)
	return ''.join(random.choice(legal_chars) for _ in range(size))

def verify_username(username):
	"""Return True when *username* has 1-20 characters, all from ``legal_chars``."""
	if not 1 <= len(username) <= 20:
		return False
	return all(char in legal_chars for char in username)

def verify_subname(subname):
	"""Return True when *subname* has 1-30 characters, all from ``legal_chars``."""
	if not 1 <= len(subname) <= 30:
		return False
	return all(char in legal_chars for char in subname)

def convert_ied(url):
	"""Turn arbitrary text into a short URL-safe slug.

	The text is lower-cased, spaces become underscores and slashes are
	dropped; the result is percent-encoded, cut to 40 characters and finally
	stripped of the ``%`` signs left by the encoding.
	"""
	slug = url.lower().replace(' ', '_').replace('/', '')
	encoded = urllib.parse.quote(slug)
	# Truncation happens on the encoded form, before the '%' signs are removed.
	return encoded[:40].replace('%', '')

def post_url_parse(url):
	"""Return the network-location part (``netloc``) of *url*, or ``''`` if it has none."""
	parsed = urllib.parse.urlparse(url)
	return parsed.netloc

def get_time():
	"""Return the current local time as a naive ``datetime``."""
	from datetime import datetime
	return datetime.now()

def time_ago(dt):
	"""Format the time elapsed since *dt* as a compact age string.

	Args:
		dt: a naive ``datetime`` comparable with ``get_time()``.

	Returns:
		``'<n>d'`` for one day or more, otherwise ``'<n>h'``, ``'<n>m'`` or
		``'<n>s'`` for the largest whole unit that fits. A *dt* that lies in
		the future (e.g. clock skew) is reported as ``'0s'``.
	"""
	diff = get_time() - dt

	# timedelta normalises negative spans to days=-1 plus positive seconds,
	# which would otherwise be rendered as a bogus number of hours.
	if diff.days < 0:
		return '0s'
	if diff.days > 0:
		return str(diff.days) + 'd'

	# With days == 0, diff.seconds is always in [0, 86400).
	seconds = diff.seconds
	if seconds < 60:
		return str(seconds) + 's'
	if seconds < 3600:
		return str(seconds // 60) + 'm'
	return str(seconds // 3600) + 'h'

def create_id_tree(comments, parent_id=None):
	"""Build a nested dict of comment ids that mirrors the reply hierarchy.

	Args:
		comments: sequence of objects exposing ``id`` and ``parent_id``.
			The sequence itself is not modified.
		parent_id: when given (and truthy), the tree is rooted at
			``int(parent_id)``; otherwise every comment whose ``parent_id``
			is ``None`` becomes a root.

	Returns:
		``{root_id: {child_id: {grandchild_id: {...}}}}``. Siblings appear in
		the order they occur in *comments*. Comments whose parent is not
		reachable from a root are left out, and so is anything nested more
		than 49 levels below a root.
	"""
	limit = 50

	tree = {}
	if not parent_id:
		for comment in comments:
			if comment.parent_id is None:
				tree[comment.id] = {}
	else:
		tree[int(parent_id)] = {}

	# Group the non-root comments by parent, preserving list order.
	children_of = {}
	for comment in comments:
		if comment.id in tree:
			continue
		children_of.setdefault(comment.parent_id, []).append(comment.id)

	# Walk the hierarchy one level at a time so the depth limit is easy to enforce.
	attached = set(tree)
	current_level = list(tree.items())
	depth = 1
	while current_level and depth < limit:
		next_level = []
		for node_id, node in current_level:
			for child_id in children_of.get(node_id, ()):
				# Guards against duplicate ids / cyclic parent links.
				if child_id in attached:
					continue
				attached.add(child_id)
				child_node = node[child_id] = {}
				next_level.append((child_id, child_node))
		current_level = next_level
		depth += 1

	return tree

def recursive_items(dictionary):
	"""Yield ``(key, value)`` pairs for every non-dict value in a nested dict.

	Values that are exactly of type ``dict`` are descended into (depth-first,
	in iteration order) instead of being yielded; the keys leading to them are
	not reported.
	"""
	# Stack of partially consumed item iterators, innermost dict last.
	pending = [iter(dictionary.items())]
	while pending:
		for key, value in pending[-1]:
			if type(value) is dict:
				# Descend now; the parent iterator resumes once this one is done.
				pending.append(iter(value.items()))
				break
			yield (key, value)
		else:
			pending.pop()

def comment_structure(comments, tree):
	"""Convert a nested dict of comment ids into a nested dict of comment objects.

	Args:
		comments: iterable of objects exposing ``id``.
		tree: nested dict keyed by comment id (same shape as the result).

	Returns:
		A dict with the same nesting as *tree* whose keys are the first
		object in *comments* with the matching ``id`` (``None`` if there is
		no such object).
	"""
	def find_comment(comment_id):
		for candidate in comments:
			if candidate.id == comment_id:
				return candidate
		return None

	return {
		find_comment(comment_id): comment_structure(comments, subtree)
		for comment_id, subtree in tree.items()
	}

# i hate math
def split_link(sst, s):
	"""Cut *s* into four pieces around the two substrings ``sst[0]`` and ``sst[1]``.

	Returns:
		``[before, first, second, after]`` where *first*/*second* are the
		slices of *s* at the positions where ``sst[0]``/``sst[1]`` are found,
		*before* stops one character short of *first* and *after* starts one
		character past *second* (i.e. one separator character is dropped on
		each side).
	"""
	first, second = sst[0], sst[1]
	first_at = s.find(first)
	second_at = s.find(second)
	first_end = first_at + len(first)
	second_end = second_at + len(second)
	return [
		s[:first_at - 1],
		s[first_at:first_end],
		s[second_at:second_end],
		s[second_end + 1:],
	]

def get_tag_count(text):
	"""Estimate how many HTML tags / line breaks *text* contains.

	The count is the sum of:

	* simple ``<tag>content</tag>`` pairs whose tag names are alphanumeric and
	  whose content holds no ``<``, ``>`` or quote characters,
	* literal ``<br>`` occurrences, and
	* newline characters (a ``\\r\\n`` pair contains one ``\\n`` and therefore
	  counts once).
	"""
	# Raw string: the previous literal relied on the invalid escape '\/'.
	paired_tags = re.findall(r'''<[a-zA-Z0-9]*>[^<>"']*</[a-zA-Z0-9]*>''', text)
	return len(paired_tags) + text.count('<br>') + text.count('\n')

def pseudo_markup(text):
	"""Render user-submitted text into an HTML fragment, one line at a time.

	Three passes run over the lines of *text*:

	1. each line goes through ``markdown`` and then ``clean(..., strip=True)``
	   and usually gets a trailing ``<br>``;
	2. pairs of triple-backtick fences become
	   ``<pre class="inline-code"><code class="inner-code">`` ... ``</code></pre>``;
	3. http(s) URLs are wrapped in ``<a href=...>`` tags.

	The lines are then joined with newlines and a series of literal string
	replacements tidies up the markup.

	A running length and tag count (see ``get_tag_count``) are kept across all
	three passes without being reset. As soon as either reaches
	``max_escaped_len`` / ``max_tag_count`` the function returns the fallback
	instead: the HTML-escaped input with ``&lt;br&gt;`` removed and newlines
	replaced by ``<br>``.

	Returns the rendered HTML string, or ``'<br>'`` if the result is empty.
	"""

	# preserve more than 1 newline
	# NOTE(review): text_len is never read again in this function.
	text_len = len(text)
	mtext = text.splitlines()

	# Fallback output, returned if the text is too long, has too many tags, etc.
	text = html.escape(text).replace('&lt;br&gt;', '').replace('\n', '<br>')

	max_escaped_len = 40000
	max_tag_count = 500
	current_tag_count = 0
	current_len = 0

	# Pass 1: convert every line individually and decide whether it gets a <br>.
	for i in range(0, len(mtext)):
		# presumably markdown() renders the line to HTML and clean() sanitizes it
		# (both are third-party; see the imports) -- TODO confirm their exact output.
		mtext[i] = clean(markdown(mtext[i]), strip=True)

		# Patterns for tags whose name does not start with 'l', 'i' or 'u'.
		regstrs = ['<[^liu].*>.*<\/[^liu]>', '^<[^liu].*>', '<\/[^liu].*>$']

		# Block-like constructs that should not be followed by a <br>.
		reg2 = ['<li>.*<\/li>', '<ul>.*<\/ul>', '<code>.*<\/code>', '<blockquote>.*<\/blockquote>']

		# addbr is only ever assigned True, so addbr2 alone decides the outcome:
		# it ends up False when at least one regstrs pattern AND at least one
		# reg2 pattern match the line.
		addbr = True
		addbr2 = True

		for reg in regstrs:
				if len(re.findall(reg, mtext[i])) != 0:
					addbr2 = True
					for r2 in reg2:
						if len(re.findall(r2, mtext[i])) != 0:
							addbr2 = False
				else:
					addbr = True

		if addbr and addbr2:
			# Lines that start with an http(s) URL get no <br> in this pass.
			if len(re.findall('^https?:\/\/.*.*$', mtext[i])) == 0:
					mtext[i] = mtext[i] + '<br>'

		current_len += len(mtext[i])
		current_tag_count += get_tag_count(mtext[i])


		# Too much output: give up and return the escaped fallback.
		if current_len >= max_escaped_len or current_tag_count >= max_tag_count:
			return text

	# code tags
	# Pass 2: a line containing ``` opens a code block, the next such line closes it.
	start, end = 0, 0
	found = False

	for i in range(len(mtext)):
		if mtext[i].find('```') != -1:
			#
			if not found:
				# Opening fence: remember line and column, then drop every ``` on this line.
				startindex = i
				start = mtext[i].find('```')
				mtext[i] = mtext[i].replace('```','')
				found = True
			else:
				# Closing fence: insert the opening tags where the first fence was
				# and replace this fence (3 characters) with the closing tags.
				end = mtext[i].find('```')
				mtext[startindex] = mtext[startindex][0:start] + '<pre class="inline-code"><code class="inner-code">' + mtext[startindex][start:]
				mtext[i] = mtext[i][0:end] + '</code></pre>' + mtext[i][end+3:]

				current_len += len(mtext[startindex])
				current_len += len(mtext[i])

				found = False
				start = 0
				end = 0

		# Every line is counted again here (the counters are not reset after pass 1).
		current_len += len(mtext[i])
		current_tag_count += get_tag_count(mtext[i])


		if current_len >= max_escaped_len or current_tag_count >= max_tag_count:
			return text

	# Pass 3: wrap bare URLs in anchors.
	for i in range(len(mtext)):
		# different variations of possible links, space at start, no
		# space, etc
		# URL surrounded by spaces.
		links = re.findall(' https?:\/\/.*\.\S+ ', mtext[i])

		if len(links) > 0:
			for link in links:
				mtext[i] = mtext[i].replace(link, ' <a href="%s">%s</a> ' % (html.escape(link).replace(' ', ''), html.escape(link).replace(' ', '')))


		# URL at the start of the line, followed by a space.
		links = re.findall('^https?:\/\/.*\.\S+ ', mtext[i])
		if len(links) > 0:
			for link in links:
				mtext[i] = mtext[i].replace(link, '<a href="%s">%s</a> ' % (html.escape(link).replace(' ', ''), html.escape(link).replace(' ', '')))


		# URL spanning the whole line.
		links = re.findall('^https?:\/\/.*\.\S+$', mtext[i])
		if len(links) > 0:
			for link in links:
				mtext[i] = mtext[i].replace(link, '<a href="%s">%s</a>' % (html.escape(link).replace(' ', ''), html.escape(link).replace(' ', '')))


		# URL preceded by a space and running to the end of the line.
		links = re.findall(' https?:\/\/.*\.\S+$', mtext[i])
		if len(links) > 0:
			for link in links:
				mtext[i] = mtext[i].replace(link, '<a href="%s"> %s</a>' % (html.escape(link).replace(' ', ''), html.escape(link).replace(' ', '')))


		# NOTE(review): same pattern and replacement as the group just above; it may
		# match again inside the anchor that group generated. The literal clean-ups
		# near the end of the function look like they compensate -- confirm before
		# removing either.
		links = re.findall(' https?:\/\/.*\.\S+$', mtext[i])
		if len(links) > 0:
			for link in links:
				mtext[i] = mtext[i].replace(link, '<a href="%s"> %s</a>' % (html.escape(link).replace(' ', ''), html.escape(link).replace(' ', '')))


		# Make sure every line carries a <br>.
		if mtext[i].find('<br>') == -1:
			# NOTE(review): this pattern begins with '$' (end of string) followed by
			# more text, so it presumably never matches -- confirm.
			if len(re.findall('$<a> href=".*"<br>', mtext[i])) == 0:
				mtext[i] += '<br>'

		current_len += len(mtext[i])
		current_tag_count += get_tag_count(mtext[i])

		if current_len >= max_escaped_len or current_tag_count >= max_tag_count:
			return text

	# From here on mtext is a single string, no longer a list of lines.
	mtext = '\n'.join([x for x in mtext])


	# NOTE(review): because mtext is now a str, mtext[i-1] is a single character
	# and can never contain '</blockquote>'; the result of replace() is also
	# discarded. This loop therefore has no effect on the output.
	repstrings = ['</blockquote>']
	for i in range(len(mtext)):
		if i > 0:
			past = mtext[i-1]
			for rep in repstrings:
				if past.find(rep) == -1:
					pass
				else:
					mtext[i].replace('<br>', '')


	# Literal clean-ups: drop newlines around code blocks.
	# NOTE(review): pass 2 emits '<pre class="inline-code">', not
	# '<div class="inline-code">'; the two <div> replacements may be leftovers -- confirm.
	mtext = mtext.replace('\n<div class="inline-code"><code>\n', '<div class="inline-code"><code>')
	mtext = mtext.replace('<code>\n', '<code>')
	mtext = mtext.replace('\n</code></div>\n', '</code></div>')
	#mtext = mtext.replace('\n\n</code>', '</code>')
	mtext = mtext.replace('\n</code>', '</code>')
	#mtext = mtext.replace('</code>\n<code>', '</code><code>')
	#mtext = mtext.replace('</code>\n', '</code>')

	#mtext = mtext.replace('\n<code>', '\n    </code>')
	# Indent the content of every <code> element with four non-breaking spaces.
	mtext = mtext.replace('<code>', '<code>&nbsp;&nbsp;&nbsp;&nbsp;')

	# No <br> directly after a blockquote or a code block.
	mtext = mtext.replace('</blockquote>\n<br>', '</blockquote>\n')
	mtext = mtext.replace('</blockquote><br>', '</blockquote>')

	mtext = mtext.replace('</pre><br>', '</pre>')


	# Remove <br> / </a> fragments (plain and escaped) that ended up inside
	# href values or anchor text during the link pass.
	mtext = mtext.replace('<br>' +'</a>', '')
	mtext = mtext.replace('<br>">', '">')
	mtext = mtext.replace('&lt;br&gt;">', '">')
	mtext = mtext.replace('&amp;lt;br&amp;gt;', '')
	mtext = mtext.replace('</a></a>', '')
	mtext = mtext.replace('&lt;/a&gt;">', '">')
	mtext = mtext.replace('&lt;/a&gt;</a>', '</a>')

	if mtext == '':
		return '<br>'

	return mtext

# Reference instant used by epoch_seconds(): 1970-01-01 00:00 as a naive datetime.
epoch = datetime(1970, 1, 1)

def epoch_seconds(date):
	"""Return the number of seconds from ``epoch`` to *date* as a float.

	*date* must be a naive ``datetime`` so it can be subtracted from ``epoch``.
	"""
	delta = date - epoch
	whole_seconds = delta.days * 86400 + delta.seconds
	fraction = float(delta.microseconds) / 1000000
	return whole_seconds + fraction

def score(ups, downs):
	"""Return the net vote score: up-votes minus down-votes."""
	net = ups - downs
	return net

def hot(ups, downs, date):
	"""Compute a "hot" ranking value from the votes and the submission time.

	The value is ``sign * log10(max(|score|, 1)) + age / 45000`` rounded to 7
	decimals, where ``age`` is ``epoch_seconds(date) - 1134028003``. This
	appears to follow the classic Reddit "hot" formula.
	"""
	net = score(ups, downs)
	magnitude = log(max(abs(net), 1), 10)

	if net > 0:
		direction = 1
	elif net < 0:
		direction = -1
	else:
		direction = 0

	age = epoch_seconds(date) - 1134028003
	return round(direction * magnitude + age / 45000, 7)

def get_youtube_vid_id(url):
	"""Extract the video id from a YouTube URL.

	Recognised forms (checked in this order):

	* ``youtube.com/watch?v=<id>``
	* ``youtube.com/v/<id>``
	* ``youtu.be/<id>``

	Anything after the id -- further query parameters, a fragment or a
	trailing path -- is discarded.

	Returns:
		The id as a string, or ``False`` when *url* is ``None`` or matches
		none of the recognised forms.
	"""
	if url is None:
		return False

	for marker in ('youtube.com/watch?v=', 'youtube.com/v/', 'youtu.be/'):
		position = url.find(marker)
		if position == -1:
			continue
		video_id = url[position + len(marker):]
		# Cut at the first character that cannot belong to the id.
		for separator in '?&#/':
			video_id = video_id.split(separator, 1)[0]
		return video_id

	return False