From 63b0fc6269b38edf7234b9f151b80d81f614c0a3 Mon Sep 17 00:00:00 2001 From: Filipp Lepalaan Date: Tue, 4 Aug 2015 10:11:24 +0300 Subject: Initial commit First public commit --- servo/lib/__init__.py | 0 servo/lib/middleware.py | 67 +++++++++++++++++++++++++ servo/lib/shorturl.py | 130 ++++++++++++++++++++++++++++++++++++++++++++++++ servo/lib/ucsv.py | 49 ++++++++++++++++++ 4 files changed, 246 insertions(+) create mode 100644 servo/lib/__init__.py create mode 100644 servo/lib/middleware.py create mode 100644 servo/lib/shorturl.py create mode 100644 servo/lib/ucsv.py (limited to 'servo/lib') diff --git a/servo/lib/__init__.py b/servo/lib/__init__.py new file mode 100644 index 0000000..e69de29 diff --git a/servo/lib/middleware.py b/servo/lib/middleware.py new file mode 100644 index 0000000..b917fa5 --- /dev/null +++ b/servo/lib/middleware.py @@ -0,0 +1,67 @@ +# -*- coding: utf-8 -*- +# Copyright (c) 2013, First Party Software +# All rights reserved. + +# Redistribution and use in source and binary forms, with or without modification, +# are permitted provided that the following conditions are met: + +# 1. Redistributions of source code must retain the above copyright notice, +# this list of conditions and the following disclaimer. + +# 2. Redistributions in binary form must reproduce the above copyright notice, +# this list of conditions and the following disclaimer in the documentation +# and/or other materials provided with the distribution. + +# THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT HOLDERS AND CONTRIBUTORS "AS IS" +# AND ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE +# IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE +# ARE DISCLAIMED. IN NO EVENT SHALL THE COPYRIGHT HOLDER OR CONTRIBUTORS BE +# LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR +# CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT +# OF SUBSTITUTE GOODS OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS INTERRUPTION) +# HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY, +# WHETHER IN CONTRACT, STRICT LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE) +# ARISING IN ANY WAY OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF +# SUCH DAMAGE. + +import pytz +from re import compile +from django.conf import settings +from django.utils import timezone +from django.http import HttpResponseRedirect + + +if hasattr(settings, 'LOGIN_EXEMPT_URLS'): + EXEMPT_URLS = [compile(expr) for expr in settings.LOGIN_EXEMPT_URLS] + + +class LoginRequiredMiddleware(object): + """ + Middleware that requires a user to be authenticated to view any page other + than LOGIN_URL. Exemptions to this requirement can optionally be specified + in settings via a list of regular expressions in LOGIN_EXEMPT_URLS (which + you can copy from your urls.py). + + Requires authentication middleware and template context processors to be + loaded. You'll get an error if they aren't. + """ + def process_request(self, request): + assert hasattr(request, 'user'), "The Login Required middleware\ + requires authentication middleware to be installed. Edit your\ + MIDDLEWARE_CLASSES setting to insert\ + 'django.contrib.auth.middlware.AuthenticationMiddleware'. If that doesn't\ + work, ensure your TEMPLATE_CONTEXT_PROCESSORS setting includes\ + 'django.core.context_processors.auth'." + if not request.user.is_authenticated(): + path = request.path_info.lstrip('/') + if not any(m.match(path) for m in EXEMPT_URLS): + return HttpResponseRedirect(settings.LOGIN_URL) + + +class TimezoneMiddleware(object): + def process_request(self, request): + tzname = request.session.get('django_timezone') + if tzname: + timezone.activate(pytz.timezone(tzname)) + else: + timezone.deactivate() diff --git a/servo/lib/shorturl.py b/servo/lib/shorturl.py new file mode 100644 index 0000000..f93028f --- /dev/null +++ b/servo/lib/shorturl.py @@ -0,0 +1,130 @@ +''' +Short URL Generator +=================== + +Python implementation for generating Tiny URL- and bit.ly-like URLs. + +A bit-shuffling approach is used to avoid generating consecutive, predictable +URLs. However, the algorithm is deterministic and will guarantee that no +collisions will occur. + +The URL alphabet is fully customizable and may contain any number of +characters. By default, digits and lower-case letters are used, with +some removed to avoid confusion between characters like o, O and 0. The +default alphabet is shuffled and has a prime number of characters to further +improve the results of the algorithm. + +The block size specifies how many bits will be shuffled. The lower BLOCK_SIZE +bits are reversed. Any bits higher than BLOCK_SIZE will remain as is. +BLOCK_SIZE of 0 will leave all bits unaffected and the algorithm will simply +be converting your integer to a different base. + +The intended use is that incrementing, consecutive integers will be used as +keys to generate the short URLs. For example, when creating a new URL, the +unique integer ID assigned by a database could be used to generate the URL +by using this module. Or a simple counter may be used. As long as the same +integer is not used twice, the same short URL will not be generated twice. + +The module supports both encoding and decoding of URLs. The min_length +parameter allows you to pad the URL if you want it to be a specific length. + +Sample Usage: + +>>> import short_url +>>> url = short_url.encode_url(12) +>>> print url +LhKA +>>> key = short_url.decode_url(url) +>>> print key +12 + +Use the functions in the top-level of the module to use the default encoder. +Otherwise, you may create your own UrlEncoder object and use its encode_url +and decode_url methods. + +Author: Michael Fogleman +License: MIT +Link: http://code.activestate.com/recipes/576918/ +''' + +MIN_LENGTH = 4 +DEFAULT_BLOCK_SIZE = 24 +DEFAULT_ALPHABET = 'mn6j2c4rvbpygw9z7hsdaetxuk3fq' + +class UrlEncoder(object): + def __init__(self, alphabet=DEFAULT_ALPHABET, block_size=DEFAULT_BLOCK_SIZE): + self.alphabet = alphabet + self.block_size = block_size + self.mask = (1 << block_size) - 1 + self.mapping = range(block_size) + self.mapping.reverse() + def encode_url(self, n, min_length=MIN_LENGTH): + return self.enbase(self.encode(n), min_length) + def decode_url(self, n): + return self.decode(self.debase(n)) + def encode(self, n): + return (n & ~self.mask) | self._encode(n & self.mask) + def _encode(self, n): + result = 0 + for i, b in enumerate(self.mapping): + if n & (1 << i): + result |= (1 << b) + return result + def decode(self, n): + return (n & ~self.mask) | self._decode(n & self.mask) + def _decode(self, n): + result = 0 + for i, b in enumerate(self.mapping): + if n & (1 << b): + result |= (1 << i) + return result + def enbase(self, x, min_length=MIN_LENGTH): + result = self._enbase(x) + padding = self.alphabet[0] * (min_length - len(result)) + return '%s%s' % (padding, result) + def _enbase(self, x): + n = len(self.alphabet) + if x < n: + return self.alphabet[x] + return self._enbase(x / n) + self.alphabet[x % n] + def debase(self, x): + n = len(self.alphabet) + result = 0 + for i, c in enumerate(reversed(x)): + result += self.alphabet.index(c) * (n ** i) + return result + +DEFAULT_ENCODER = UrlEncoder() + +def encode(n): + return DEFAULT_ENCODER.encode(n) + +def decode(n): + return DEFAULT_ENCODER.decode(n) + +def enbase(n, min_length=MIN_LENGTH): + return DEFAULT_ENCODER.enbase(n, min_length) + +def debase(n): + return DEFAULT_ENCODER.debase(n) + +def encode_url(n, min_length=MIN_LENGTH): + return DEFAULT_ENCODER.encode_url(n, min_length) + +def decode_url(n): + return DEFAULT_ENCODER.decode_url(n) + +def from_time(): + from time import time + return encode_url(int(time()*1000)).upper() + +if __name__ == '__main__': + for a in range(0, 200000, 37): + b = encode(a) + c = enbase(b) + d = debase(c) + e = decode(d) + assert a == e + assert b == d + c = (' ' * (7 - len(c))) + c + print '%6d %12d %s %12d %6d' % (a, b, c, d, e) diff --git a/servo/lib/ucsv.py b/servo/lib/ucsv.py new file mode 100644 index 0000000..91b2acf --- /dev/null +++ b/servo/lib/ucsv.py @@ -0,0 +1,49 @@ +""" +Borrwed from +http://stackoverflow.com/questions/1846135/python-csv-library-with-unicode-utf-8-support-that-just-works +""" + +import csv +import codecs + +class UnicodeCsvReader(object): + def __init__(self, f, encoding="utf-8", **kwargs): + self.csv_reader = csv.reader(f, **kwargs) + self.encoding = encoding + + def __iter__(self): + return self + + def next(self): + # read and split the csv row into fields + row = self.csv_reader.next() + # now decode + return [unicode(cell, self.encoding) for cell in row] + + @property + def line_num(self): + return self.csv_reader.line_num + + +class UnicodeDictReader(csv.DictReader): + def __init__(self, f, encoding="utf-8", fieldnames=None, **kwargs): + csv.DictReader.__init__(self, f, fieldnames=fieldnames, **kwargs) + self.reader = UnicodeCsvReader(f, encoding=encoding, **kwargs) + + +def read_excel_file(f): + dialect = csv.Sniffer().sniff(codecs.EncodedFile(f, "utf-8").read(1024)) + #f.open() + return UnicodeCsvReader(codecs.EncodedFile(f, "utf-8"), + "utf-8", dialect=dialect) + +def main(): + import sys + with codecs.open(sys.argv[1], 'rUb') as csvfile: + reader = read_excel_file(csvfile) + for row in reader: + print u', '.join(row) + + +if __name__ == '__main__': + main() -- cgit v1.2.3