[PYTHON] Script to create a Mac dictionary file

A quick-and-dirty script that creates a dictionary file of the emoji shortcodes that can be used in Markdown on GitHub. If you import the created file in the settings and convert "Eji", you get an emoji shortcode that can be used on GitHub, such as `:hoge:`.

The emoji names are taken from http://www.emoji-cheat-sheet.com.


# Work in a fresh, timestamped directory under /tmp.
EMOJI_DIR="/tmp/emoji_$(date +"%Y%m%d_%H%M%S")"
mkdir -p "$EMOJI_DIR"

# Write the dictionary as UTF-8 first, then convert that file to UTF-16.
utf8_dict="$EMOJI_DIR/mardkdown_utf8.txt"
utf16_dict="$EMOJI_DIR/mardkdown.txt"
python emoji_to_dic.py > "$utf8_dict"
iconv -f utf-8 -t utf-16 "$utf8_dict" > "$utf16_dict"


#!/usr/bin/env python
# -*- coding: utf-8 -*-
import argparse
import codecs
import sys
import urllib
from HTMLParser import HTMLParser

# Fixed variables
url = 'http://www.emoji-cheat-sheet.com/'

class EmojiParser(HTMLParser):
  """Print a dictionary entry for every emoji name found in the fed HTML.

  The text of each ``<span class="name">`` element is treated as an emoji
  name and printed to standard output as one line of the form
  ``"Eji",":<name>:","Appellative"``.
  """

  def __init__(self):
    # The base initializer sets up the parser's internal buffer; feed()
    # fails without it.  It is called explicitly (not through super()) so
    # the same code also works where HTMLParser is an old-style class.
    HTMLParser.__init__(self)
    # True while the most recently opened tag is <span class="name">.
    self.isToken = False
    # Not used by the handlers below; kept so the attribute stays available.
    self.token = ''

  def handle_starttag(self, tag, attrs):
    """Record whether the tag just opened is a ``<span class="name">``.

    Args:
      tag: Tag name as reported by HTMLParser.
      attrs: List of ``(name, value)`` attribute pairs for the tag.
    """
    attrs = dict(attrs)
    # Every start tag resets the flag, so only text that follows a matching
    # span (with no other start tag in between) is reported.
    self.isToken = tag == 'span' and attrs.get('class') == 'name'

  def handle_data(self, data):
    """Print a dictionary entry when ``data`` follows a name span.

    Args:
      data: Text content reported by HTMLParser.
    """
    # Drop surrounding backslashes, spaces, newlines and colons.
    data = data.strip('\\ \n:')
    if not self.isToken or not data:
      return
    # Single-argument call form: behaves like the print statement on
    # Python 2 and is also valid on Python 3.
    print(u'"Eji",":' + data + u':","Appellative"')

def GetParser():
  """Create and return a new EmojiParser instance."""
  emoji_parser = EmojiParser()
  return emoji_parser

if __name__ == "__main__":
  # Fetch the cheat-sheet page at `url` and print one dictionary entry per
  # emoji name to standard output, encoded as UTF-8.
  parser = GetParser()
  if not parser:
    # Report on stderr so the message cannot end up in redirected output,
    # and stop instead of carrying on without a parser.
    sys.stderr.write('none parser.\n')
    sys.exit(1)
  # Encode everything printed from here on as UTF-8.
  sys.stdout = codecs.getwriter('utf_8')(sys.stdout)
  response = urllib.urlopen(url)
  try:
    # Assumes the page is served as UTF-8 (TODO confirm); undecodable bytes
    # are replaced rather than aborting the run.
    html = response.read().decode('utf-8', 'replace')
  finally:
    response.close()
  parser.feed(html)
  parser.close()

