summary | refs | log | tree | commit | diff
diff options
context:
space:
mode:
author Maksim A. Boyko <maksim.a.boyko@gmail.com> 2012-10-28 12:34:36 -0400
committer Maksim A. Boyko <maksim.a.boyko@gmail.com> 2012-10-28 12:34:36 -0400
commit f1b61a3646f11484962e80368093364bbfd1f33c (patch)
tree dcb94247fcd981ce55671efa5f3201df5c7da6e0
parent e07cc3385fa276481a532c7008e8e1a23264df04 (diff)
tools: Add detect encodings
-rwxr-xr-x tools/migrate_db.py 5
1 files changed, 4 insertions, 1 deletions
diff --git a/tools/migrate_db.py b/tools/migrate_db.py
index 18a70f8..254d806 100755
--- a/tools/migrate_db.py
+++ b/tools/migrate_db.py
@@ -2,6 +2,7 @@
import os
import sys
+import chardet
sys.path.append(os.path.join(os.path.dirname(__file__), '..'))
os.environ['DJANGO_SETTINGS_MODULE'] = 'scannerjammer.settings'
@@ -37,7 +38,8 @@ class MigrateDB(DB):
row = list(row)
for i, r in enumerate(row[:]):
if isinstance(r, str):
- row[i] = unicode(r, 'utf-8', 'replace')
+ detect = chardet.detect(r)
+ row[i] = unicode(r, detect['encoding'] or 'utf8', 'replace')
yield dict(zip(fields, row))
def get_radio_chat_table(self):
@@ -139,6 +141,7 @@ if __name__ == '__main__':
user=user,
datetime=datetime.fromtimestamp(row['date'])
)
+ print 'SJ Search Log Found'
except SJSearch.DoesNotExist:
sjsearch = SJSearch(
user=user,