1 #!/usr/bin/python 2 3 # DO NOT ALTER OR REMOVE COPYRIGHT NOTICES OR THIS HEADER. 4 # 5 # Copyright (c) 2007 Sun Microsystems, Inc. All Rights Reserved. 6 # 7 # The contents of this file are subject to the terms of either the GNU Lesser 8 # General Public License Version 2.1 only ("LGPL") or the Common Development and 9 # Distribution License ("CDDL")(collectively, the "License"). You may not use this 10 # file except in compliance with the License. You can obtain a copy of the CDDL at 11 # http://www.opensource.org/licenses/cddl1.php and a copy of the LGPLv2.1 at 12 # http://www.opensource.org/licenses/lgpl-license.php. See the License for the 13 # specific language governing permissions and limitations under the License. When 14 # distributing the software, include this License Header Notice in each file and 15 # include the full text of the License in the License file as well as the 16 # following notice: 17 # 18 # NOTICE PURSUANT TO SECTION 9 OF THE COMMON DEVELOPMENT AND DISTRIBUTION LICENSE 19 # (CDDL) 20 # For Covered Software in this distribution, this License shall be governed by the 21 # laws of the State of California (excluding conflict-of-law provisions). 22 # Any litigation relating to this License shall be subject to the jurisdiction of 23 # the Federal Courts of the Northern District of California and the state courts 24 # of the State of California, with venue lying in Santa Clara County, California. 25 # 26 # Contributor(s): 27 # 28 # If you wish your version of this file to be governed by only the CDDL or only 29 # the LGPL Version 2.1, indicate your decision by adding "[Contributor]" elects to 30 # include this software in this distribution under the [CDDL or LGPL Version 2.1] 31 # license." If you don't indicate a single choice of license, a recipient has the 32 # option to distribute your version of this file under either the CDDL or the LGPL 33 # Version 2.1, or to extend the choice of license to its licensees as provided 34 # above. However, if you add LGPL Version 2.1 code and therefore, elected the LGPL 35 # Version 2 license, then the option applies only if the new code is made subject 36 # to such option by the copyright holder. 37 38 import codecs 39 from trie import Trie 40 41 class IMDict (Trie): 42 def __init__(self, fname): 43 super (IMDict, self).__init__() 44 self.load(fname) 45 46 def load(self, fname): 47 file = codecs.open(fname, 'r', 'utf-8') 48 for line in file: 49 line = line.strip() 50 if line[0] not in ('#', '<', '\n'): 51 word, id= line.split(' ')[0:2] 52 self.add(word, int(id)) 53 file.close() 54