try: 
            with open(file_path, 'r') as f:
                doc = {}
                lines = f.readlines()
                # get first word of all the lines