{ "cells": [ { "cell_type": "markdown", "metadata": {}, "source": [ "## Uczenie głębokie – przetwarzanie tekstu – laboratoria\n", "# 3. RNN" ] }, { "cell_type": "code", "execution_count": 60, "metadata": {}, "outputs": [ { "name": "stderr", "output_type": "stream", "text": [ "usage: jupyter [-h] [--version] [--config-dir] [--data-dir] [--runtime-dir]\n", " [--paths] [--json] [--debug]\n", " [subcommand]\n", "\n", "Jupyter: Interactive Computing\n", "\n", "positional arguments:\n", " subcommand the subcommand to launch\n", "\n", "options:\n", " -h, --help show this help message and exit\n", " --version show the versions of core jupyter packages and exit\n", " --config-dir show Jupyter config dir\n", " --data-dir show Jupyter data dir\n", " --runtime-dir show Jupyter runtime dir\n", " --paths show all Jupyter paths. Add --json for machine-readable\n", " format.\n", " --json output paths as machine-readable json\n", " --debug output debug information about paths\n", "\n", "Available subcommands: console dejavu events execute kernel kernelspec lab\n", "labextension labhub migrate nbconvert notebook qtconsole run server\n", "troubleshoot trust\n", "\n", "Jupyter command `jupyter-nbextension` not found.\n" ] } ], "source": [ "!jupyter nbextension enable --py widgetsnbextension\n", "\n", "from collections import Counter\n", "import torch\n", "from torchtext.vocab import vocab\n", "from tqdm import tqdm\n", "from ipywidgets import FloatProgress\n", "\n", "import pandas as pd\n", "from nltk.tokenize import word_tokenize\n", "from unidecode import unidecode" ] }, { "cell_type": "code", "execution_count": 61, "metadata": {}, "outputs": [ { "name": "stdout", "output_type": "stream", "text": [ "wczytano dane treningowe\n", "B-ORG O B-MISC O O O B-MISC O O O B-PER I-PER O B-LOC O O O B-ORG I-ORG O O O O O O B-MISC O O O O O B-MISC O O O O O O O O O O O O O O O B-LOC O O O O B-ORG I-ORG O O O B-PER I-PER O O O O O O O O O O O B-LOC O O O O O O O O O O O O O O O O O O O O O O O O 
O O O O B-ORG O O O B-PER I-PER I-PER I-PER O O O O O O O O O O O O O O O O O O O O O O O O O O O O B-ORG I-ORG O O O O O O O O O B-ORG O O B-PER I-PER O O O O O O O O O O O O O O O O O O O O O O O O O O O O O B-PER O B-MISC O O O O B-LOC O B-LOC O O O O O O O B-MISC I-MISC I-MISC O B-MISC O O O O O O O O B-PER O O O O O O O B-ORG O O O O O O O O O O O O O O O O O O O O O O O O O O O O B-MISC O O B-PER I-PER I-PER O O O B-PER O O B-ORG O O O O O O O O O O O O O O O O O O B-LOC O B-LOC O B-PER O O O O O B-ORG O O O O O O O O O O O O O O O O O O O O O O O O O O O O O O O O O O O O O O O B-MISC O O O O O O O O O O O O O O O O B-MISC O O O O O O O O O O O O O O O O O O O B-MISC O O O O O O B-MISC O O O O O B-LOC O O O O O O O O O O O O O O O O O O O B-LOC O O O O B-ORG I-ORG I-ORG I-ORG I-ORG O B-ORG O O B-PER I-PER I-PER O O B-ORG I-ORG O O B-LOC O O O O O O O O O O O O O O O B-MISC O O O O O O O O O O O O O O O O O O B-LOC O O O O B-LOC O O O O O O O O O O O O O O O O B-MISC O O O O O O O O O O EU rejects German call to boycott British lamb . Peter Blackburn BRUSSELS 1996-08-22 The European Commission said on Thursday it disagreed with German advice to consumers to shun British lamb until scientists determine whether mad cow disease can be transmitted to sheep . Germany 's representative to the European Union 's veterinary committee Werner Zwingmann said on Wednesday consumers should buy sheepmeat from countries other than Britain until the scientific advice was clearer . \" We do n't support any such recommendation because we do n't see any grounds for it , \" the Commission 's chief spokesman Nikolaus van der Pas told a news briefing . He said further scientific study was required and if it was found that action was needed it should be taken by the European Union . 
He said a proposal last month by EU Farm Commissioner Franz Fischler to ban sheep brains , spleens and spinal cords from the human and animal food chains was a highly specific and precautionary move to protect human health . Fischler proposed EU-wide measures after reports from Britain and France that under laboratory conditions sheep could contract Bovine Spongiform Encephalopathy ( BSE ) -- mad cow disease . But Fischler agreed to review his proposal after the EU 's standing veterinary committee , mational animal health officials , questioned if such action was justified as there was only a slight risk to human health . Spanish Farm Minister Loyola de Palacio had earlier accused Fischler at an EU farm ministers ' meeting of causing unjustified alarm through \" dangerous generalisation . \" . Only France and Britain backed Fischler 's proposal . The EU 's scientific veterinary and multidisciplinary committees are due to re-examine the issue early next month and make recommendations to the senior veterinary officials . Sheep have long been known to contract scrapie , a brain-wasting disease similar to BSE which is believed to have been transferred to cattle through feed containing animal waste . British farmers denied on Thursday there was any danger to human health from their sheep , but expressed concern that German government advice to consumers to avoid British lamb might influence consumers across Europe . \" What we have to be extremely careful of is how other countries are going to take Germany 's lead , \" Welsh National Farmers ' Union ( NFU ) chairman John Lloyd Jones said on BBC radio . Bonn has led efforts to protect public health after consumer confidence collapsed in March after a British report suggested humans could contract an illness similar to mad cow disease by eating contaminated beef . Germany imported 47,600 sheep from Britain last year , nearly half of total imports . 
It brought in 4,275 tonnes of British mutton , some 10 percent of overall imports . \n", "489\n", "489\n", "podzielono dane treningowe na słowa\n", "['eu', 'rejects', 'german', 'call', 'to', 'boycott', 'british', 'lamb', '.', '', 'peter', 'blackburn', '', 'brussels', '1996-08-22', '', 'the', 'european', 'commission', 'said', 'on', 'thursday', 'it', 'disagreed', 'with', 'german', 'advice', 'to', 'consumers', 'to', 'shun', 'british', 'lamb', 'until', 'scientists', 'determine', 'whether', 'mad', 'cow', 'disease', 'can', 'be', 'transmitted', 'to', 'sheep', '.', '', 'germany', \"'s\", 'representative', 'to', 'the', 'european', 'union', \"'s\", 'veterinary', 'committee', 'werner', 'zwingmann', 'said', 'on', 'wednesday', 'consumers', 'should', 'buy', 'sheepmeat', 'from', 'countries', 'other', 'than', 'britain', 'until', 'the', 'scientific', 'advice', 'was', 'clearer', '.', '', '\"', 'we', 'do', \"n't\", 'support', 'any', 'such', 'recommendation', 'because', 'we', 'do', \"n't\", 'see', 'any', 'grounds', 'for', 'it', ',', '\"', 'the', 'commission', \"'s\", 'chief', 'spokesman', 'nikolaus', 'van', 'der', 'pas', 'told', 'a', 'news', 'briefing', '.', '', 'he', 'said', 'further', 'scientific', 'study', 'was', 'required', 'and', 'if', 'it', 'was', 'found', 'that', 'action', 'was', 'needed', 'it', 'should', 'be', 'taken', 'by', 'the', 'european', 'union', '.', '', 'he', 'said', 'a', 'proposal', 'last', 'month', 'by', 'eu', 'farm', 'commissioner', 'franz', 'fischler', 'to', 'ban', 'sheep', 'brains', ',', 'spleens', 'and', 'spinal', 'cords', 'from', 'the', 'human', 'and', 'animal', 'food', 'chains', 'was', 'a', 'highly', 'specific', 'and', 'precautionary', 'move', 'to', 'protect', 'human', 'health', '.', '', 'fischler', 'proposed', 'eu-wide', 'measures', 'after', 'reports', 'from', 'britain', 'and', 'france', 'that', 'under', 'laboratory', 'conditions', 'sheep', 'could', 'contract', 'bovine', 'spongiform', 'encephalopathy', '(', 'bse', ')', '--', 'mad', 'cow', 'disease', '.', '', 
'but', 'fischler', 'agreed', 'to', 'review', 'his', 'proposal', 'after', 'the', 'eu', \"'s\", 'standing', 'veterinary', 'committee', ',', 'mational', 'animal', 'health', 'officials', ',', 'questioned', 'if', 'such', 'action', 'was', 'justified', 'as', 'there', 'was', 'only', 'a', 'slight', 'risk', 'to', 'human', 'health', '.', '', 'spanish', 'farm', 'minister', 'loyola', 'de', 'palacio', 'had', 'earlier', 'accused', 'fischler', 'at', 'an', 'eu', 'farm', 'ministers', \"'\", 'meeting', 'of', 'causing', 'unjustified', 'alarm', 'through', '\"', 'dangerous', 'generalisation', '.', '\"', '', '.', '', 'only', 'france', 'and', 'britain', 'backed', 'fischler', \"'s\", 'proposal', '.', '', 'the', 'eu', \"'s\", 'scientific', 'veterinary', 'and', 'multidisciplinary', 'committees', 'are', 'due', 'to', 're-examine', 'the', 'issue', 'early', 'next', 'month', 'and', 'make', 'recommendations', 'to', 'the', 'senior', 'veterinary', 'officials', '.', '', 'sheep', 'have', 'long', 'been', 'known', 'to', 'contract', 'scrapie', ',', 'a', 'brain-wasting', 'disease', 'similar', 'to', 'bse', 'which', 'is', 'believed', 'to', 'have', 'been', 'transferred', 'to', 'cattle', 'through', 'feed', 'containing', 'animal', 'waste', '.', '', 'british', 'farmers', 'denied', 'on', 'thursday', 'there', 'was', 'any', 'danger', 'to', 'human', 'health', 'from', 'their', 'sheep', ',', 'but', 'expressed', 'concern', 'that', 'german', 'government', 'advice', 'to', 'consumers', 'to', 'avoid', 'british', 'lamb', 'might', 'influence', 'consumers', 'across', 'europe', '.', '', '\"', 'what', 'we', 'have', 'to', 'be', 'extremely', 'careful', 'of', 'is', 'how', 'other', 'countries', 'are', 'going', 'to', 'take', 'germany', \"'s\", 'lead', ',', '\"', 'welsh', 'national', 'farmers', \"'\", 'union', '(', 'nfu', ')', 'chairman', 'john', 'lloyd', 'jones', 'said', 'on', 'bbc', 'radio', '.', '', 'bonn', 'has', 'led', 'efforts', 'to', 'protect', 'public', 'health', 'after', 'consumer', 'confidence', 'collapsed', 'in', 'march', 
import csv  # stdlib; needed only for the QUOTE_NONE constant below

# Load the training data: tab-separated, no header row, one document per row.
# Column "y" is the space-separated NER label sequence and column "x" the
# space-separated tokens of the same document.
# quoting=csv.QUOTE_NONE: the corpus contains literal '"' tokens, so quote
# characters must not be interpreted as CSV field delimiters. With the default
# quoting a document that *starts* with '"' would have its quotes stripped and
# end up with fewer tokens than labels.
train = pd.read_csv(
    'train/train.tsv',
    sep='\t',
    names=['y', 'x'],
    header=None,
    quoting=csv.QUOTE_NONE,
)

print("wczytano dane treningowe")
print(train["y"][0], train["x"][0])

# Sanity check on the first document: number of labels vs. number of tokens.
print(len(train["y"][0].split(" ")))
print(len(train["x"][0].split(" ")))

# Split every document into lower-cased tokens.
# The split is on a single space (not a bare .split()) on purpose: empty
# tokens are kept, so token positions stay aligned with the label sequence.
slowa_train = [
    [slowo.lower() for slowo in tekst.split(" ")]
    for tekst in train["x"]
]
print("podzielono dane treningowe na słowa")

print(slowa_train[0])
print(len(slowa_train[0]))
After bowling Somerset out for 83 on the opening morning at Grace Road , Leicestershire extended their first innings by 94 runs before being bowled out for 296 with England discard Andy Caddick taking three for 83 . Trailing by 213 , Somerset got a solid start to their second innings before Simmons stepped in to bundle them out for 174 . Essex , however , look certain to regain their top spot after Nasser Hussain and Peter Such gave them a firm grip on their match against Yorkshire at Headingley . Hussain , considered surplus to England 's one-day requirements , struck 158 , his first championship century of the season , as Essex reached 372 and took a first innings lead of 82 . By the close Yorkshire had turned that into a 37-run advantage but off-spinner Such had scuttled their hopes , taking four for 24 in 48 balls and leaving them hanging on 119 for five and praying for rain . At the Oval , Surrey captain Chris Lewis , another man dumped by England , continued to silence his critics as he followed his four for 45 on Thursday with 80 not out on Friday in the match against Warwickshire . He was well backed by England hopeful Mark Butcher who made 70 as Surrey closed on 429 for seven , a lead of 234 . Derbyshire kept up the hunt for their first championship title since 1936 by reducing Worcestershire to 133 for five in their second innings , still 100 runs away from avoiding an innings defeat . Australian Tom Moody took six for 82 but Chris Adams , 123 , and Tim O'Gorman , 109 , took Derbyshire to 471 and a first innings lead of 233 . After the frustration of seeing the opening day of their match badly affected by the weather , Kent stepped up a gear to dismiss Nottinghamshire for 214 . They were held up by a gritty 84 from Paul Johnson but ex-England fast bowler Martin McCague took four for 55 . By stumps Kent had reached 108 for three . 
\n", "podzielono dane treningowe na słowa\n", "['cricket', '-', 'leicestershire', 'take', 'over', 'at', 'top', 'after', 'innings', 'victory', '.', '', 'london', '1996-08-30', '', 'west', 'indian', 'all-rounder', 'phil', 'simmons', 'took', 'four', 'for', '38', 'on', 'friday', 'as', 'leicestershire', 'beat', 'somerset', 'by', 'an', 'innings', 'and', '39', 'runs', 'in', 'two', 'days', 'to', 'take', 'over', 'at', 'the', 'head', 'of', 'the', 'county', 'championship', '.', '', 'their', 'stay', 'on', 'top', ',', 'though', ',', 'may', 'be', 'short-lived', 'as', 'title', 'rivals', 'essex', ',', 'derbyshire', 'and', 'surrey', 'all', 'closed', 'in', 'on', 'victory', 'while', 'kent', 'made', 'up', 'for', 'lost', 'time', 'in', 'their', 'rain-affected', 'match', 'against', 'nottinghamshire', '.', '', 'after', 'bowling', 'somerset', 'out', 'for', '83', 'on', 'the', 'opening', 'morning', 'at', 'grace', 'road', ',', 'leicestershire', 'extended', 'their', 'first', 'innings', 'by', '94', 'runs', 'before', 'being', 'bowled', 'out', 'for', '296', 'with', 'england', 'discard', 'andy', 'caddick', 'taking', 'three', 'for', '83', '.', '', 'trailing', 'by', '213', ',', 'somerset', 'got', 'a', 'solid', 'start', 'to', 'their', 'second', 'innings', 'before', 'simmons', 'stepped', 'in', 'to', 'bundle', 'them', 'out', 'for', '174', '.', '', 'essex', ',', 'however', ',', 'look', 'certain', 'to', 'regain', 'their', 'top', 'spot', 'after', 'nasser', 'hussain', 'and', 'peter', 'such', 'gave', 'them', 'a', 'firm', 'grip', 'on', 'their', 'match', 'against', 'yorkshire', 'at', 'headingley', '.', '', 'hussain', ',', 'considered', 'surplus', 'to', 'england', \"'s\", 'one-day', 'requirements', ',', 'struck', '158', ',', 'his', 'first', 'championship', 'century', 'of', 'the', 'season', ',', 'as', 'essex', 'reached', '372', 'and', 'took', 'a', 'first', 'innings', 'lead', 'of', '82', '.', '', 'by', 'the', 'close', 'yorkshire', 'had', 'turned', 'that', 'into', 'a', '37-run', 'advantage', 'but', 'off-spinner', 
import csv  # stdlib; needed only for the QUOTE_NONE constant below

# Load the dev-0 evaluation input: a single text column "x", no header row,
# one document per row.
# quoting=csv.QUOTE_NONE keeps '"' as an ordinary character; with the default
# quoting a document that starts with '"' would have its quotes stripped, and
# the predicted label sequence would no longer match the input token count.
test_dev0 = pd.read_csv(
    'dev-0/in.tsv',
    sep='\t',
    names=['x'],
    header=None,
    quoting=csv.QUOTE_NONE,
)

print("wczytano dane testowe dev-0")
print(test_dev0["x"][0])

# Split every document into lower-cased tokens.
# Splitting on a single space (not a bare .split()) keeps empty tokens, so
# the number of tokens per document is preserved exactly.
slowa_test_dev0 = [
    [slowo.lower() for slowo in tekst.split(" ")]
    for tekst in test_dev0["x"]
]
# The message used to say "treningowe" (training) - a copy-paste slip from
# the training cell; this cell processes the dev-0 data.
print("podzielono dane testowe dev-0 na słowa")

print(slowa_test_dev0[0])
print(len(slowa_test_dev0[0]))
It was the second costly blunder by Syria in four minutes . Defender Hassan Abbas rose to intercept a long ball into the area in the 84th minute but only managed to divert it into the top corner of Bitar 's goal . Nader Jokhadar had given Syria the lead with a well-struck header in the seventh minute . Japan then laid siege to the Syrian penalty area for most of the game but rarely breached the Syrian defence . Bitar pulled off fine saves whenever they did . Japan coach Shu Kamo said : ' ' The Syrian own goal proved lucky for us . The Syrians scored early and then played defensively and adopted long balls which made it hard for us . ' ' Japan , co-hosts of the World Cup in 2002 and ranked 20th in the world by FIFA , are favourites to regain their title here . Hosts UAE play Kuwait and South Korea take on Indonesia on Saturday in Group A matches . All four teams are level with one point each from one game . \n", "podzielono dane treningowe na słowa\n", "['soccer', '-', 'japan', 'get', 'lucky', 'win', ',', 'china', 'in', 'surprise', 'defeat', '.', '', 'nadim', 'ladki', '', 'al-ain', ',', 'united', 'arab', 'emirates', '1996-12-06', '', 'japan', 'began', 'the', 'defence', 'of', 'their', 'asian', 'cup', 'title', 'with', 'a', 'lucky', '2-1', 'win', 'against', 'syria', 'in', 'a', 'group', 'c', 'championship', 'match', 'on', 'friday', '.', '', 'but', 'china', 'saw', 'their', 'luck', 'desert', 'them', 'in', 'the', 'second', 'match', 'of', 'the', 'group', ',', 'crashing', 'to', 'a', 'surprise', '2-0', 'defeat', 'to', 'newcomers', 'uzbekistan', '.', '', 'china', 'controlled', 'most', 'of', 'the', 'match', 'and', 'saw', 'several', 'chances', 'missed', 'until', 'the', '78th', 'minute', 'when', 'uzbek', 'striker', 'igor', 'shkvyrin', 'took', 'advantage', 'of', 'a', 'misdirected', 'defensive', 'header', 'to', 'lob', 'the', 'ball', 'over', 'the', 'advancing', 'chinese', 'keeper', 'and', 'into', 'an', 'empty', 'net', '.', '', 'oleg', 'shatskiku', 'made', 'sure', 'of', 'the', 'win', 
'in', 'injury', 'time', ',', 'hitting', 'an', 'unstoppable', 'left', 'foot', 'shot', 'from', 'just', 'outside', 'the', 'area', '.', '', 'the', 'former', 'soviet', 'republic', 'was', 'playing', 'in', 'an', 'asian', 'cup', 'finals', 'tie', 'for', 'the', 'first', 'time', '.', '', 'despite', 'winning', 'the', 'asian', 'games', 'title', 'two', 'years', 'ago', ',', 'uzbekistan', 'are', 'in', 'the', 'finals', 'as', 'outsiders', '.', '', 'two', 'goals', 'from', 'defensive', 'errors', 'in', 'the', 'last', 'six', 'minutes', 'allowed', 'japan', 'to', 'come', 'from', 'behind', 'and', 'collect', 'all', 'three', 'points', 'from', 'their', 'opening', 'meeting', 'against', 'syria', '.', '', 'takuya', 'takagi', 'scored', 'the', 'winner', 'in', 'the', '88th', 'minute', ',', 'rising', 'to', 'head', 'a', 'hiroshige', 'yanagimoto', 'cross', 'towards', 'the', 'syrian', 'goal', 'which', 'goalkeeper', 'salem', 'bitar', 'appeared', 'to', 'have', 'covered', 'but', 'then', 'allowed', 'to', 'slip', 'into', 'the', 'net', '.', '', 'it', 'was', 'the', 'second', 'costly', 'blunder', 'by', 'syria', 'in', 'four', 'minutes', '.', '', 'defender', 'hassan', 'abbas', 'rose', 'to', 'intercept', 'a', 'long', 'ball', 'into', 'the', 'area', 'in', 'the', '84th', 'minute', 'but', 'only', 'managed', 'to', 'divert', 'it', 'into', 'the', 'top', 'corner', 'of', 'bitar', \"'s\", 'goal', '.', '', 'nader', 'jokhadar', 'had', 'given', 'syria', 'the', 'lead', 'with', 'a', 'well-struck', 'header', 'in', 'the', 'seventh', 'minute', '.', '', 'japan', 'then', 'laid', 'siege', 'to', 'the', 'syrian', 'penalty', 'area', 'for', 'most', 'of', 'the', 'game', 'but', 'rarely', 'breached', 'the', 'syrian', 'defence', '.', '', 'bitar', 'pulled', 'off', 'fine', 'saves', 'whenever', 'they', 'did', '.', '', 'japan', 'coach', 'shu', 'kamo', 'said', ':', \"'\", \"'\", 'the', 'syrian', 'own', 'goal', 'proved', 'lucky', 'for', 'us', '.', '', 'the', 'syrians', 'scored', 'early', 'and', 'then', 'played', 'defensively', 'and', 'adopted', 
import csv  # stdlib; needed only for the QUOTE_NONE constant below

# Load the test-A evaluation input: a single text column "x", no header row,
# one document per row.
# quoting=csv.QUOTE_NONE keeps '"' as an ordinary character; with the default
# quoting a document that starts with '"' would have its quotes stripped, and
# the predicted label sequence would no longer match the input token count.
test_A = pd.read_csv(
    'test-A/in.tsv',
    sep='\t',
    names=['x'],
    header=None,
    quoting=csv.QUOTE_NONE,
)

print("wczytano dane testowe A")
print(test_A["x"][0])

# Split every document into lower-cased tokens.
# Splitting on a single space (not a bare .split()) keeps empty tokens, so
# the number of tokens per document is preserved exactly.
slowa_test_A = [
    [slowo.lower() for slowo in tekst.split(" ")]
    for tekst in test_A["x"]
]
# The message used to say "treningowe" (training) - a copy-paste slip from
# the training cell; this cell processes the test-A data.
print("podzielono dane testowe A na słowa")

print(slowa_test_A[0])


def build_vocab(dataset):
    """Build a torchtext vocabulary from tokenised documents.

    Args:
        dataset: iterable of documents, each an iterable of string tokens
            (e.g. ``slowa_train``).

    Returns:
        The vocabulary object produced by ``torchtext.vocab.vocab``. The four
        special tokens come first, followed by the tokens counted in
        ``dataset``. No default index is set here, so callers that need
        out-of-vocabulary handling must configure it themselves.
    """
    counter = Counter()
    for document in dataset:
        counter.update(document)
    # The specials have to be four *distinct* strings: torchtext refuses to
    # build a vocabulary containing duplicate tokens, and identical empty
    # strings would also be indistinguishable from each other and from a real
    # empty token in the data.
    # NOTE(review): names follow the usual unk/pad/bos/eos convention -
    # confirm they match the lookups used further down the notebook.
    return vocab(counter, specials=["<unk>", "<pad>", "<bos>", "<eos>"])
'representative', 'union', 'veterinary', 'committee', 'werner', 'zwingmann', 'wednesday', 'should', 'buy', 'sheepmeat', 'from', 'countries', 'other', 'than', 'britain', 'scientific', 'was', 'clearer', '\"', 'we', 'do', \"n't\", 'support', 'any', 'such', 'recommendation', 'because', 'see', 'grounds', 'for', ',', 'chief', 'spokesman', 'nikolaus', 'van', 'der', 'pas', 'told', 'a', 'news', 'briefing', 'he', 'further', 'study', 'required', 'and', 'if', 'found', 'that', 'action', 'needed', 'taken', 'by', 'proposal', 'last', 'month', 'farm', 'commissioner', 'franz', 'fischler', 'ban', 'brains', 'spleens', 'spinal', 'cords', 'human', 'animal', 'food', 'chains', 'highly', 'specific', 'precautionary', 'move', 'protect', 'health', 'proposed', 'eu-wide', 'measures', 'after', 'reports', 'france', 'under', 'laboratory', 'conditions', 'could', 'contract', 'bovine', 'spongiform', 'encephalopathy', '(', 'bse', ')', '--', 'but', 'agreed', 'review', 'his', 'standing', 'mational', 'officials', 'questioned', 'justified', 'as', 'there', 'only', 'slight', 'risk', 'spanish', 'minister', 'loyola', 'de', 'palacio', 'had', 'earlier', 'accused', 'at', 'an', 'ministers', \"'\", 'meeting', 'of', 'causing', 'unjustified', 'alarm', 'through', 'dangerous', 'generalisation', 'backed', 'multidisciplinary', 'committees', 'are', 'due', 're-examine', 'issue', 'early', 'next', 'make', 'recommendations', 'senior', 'have', 'long', 'been', 'known', 'scrapie', 'brain-wasting', 'similar', 'which', 'is', 'believed', 'transferred', 'cattle', 'feed', 'containing', 'waste', 'farmers', 'denied', 'danger', 'their', 'expressed', 'concern', 'government', 'avoid', 'might', 'influence', 'across', 'europe', 'what', 'extremely', 'careful', 'how', 'going', 'take', 'lead', 'welsh', 'national', 'nfu', 'chairman', 'john', 'lloyd', 'jones', 'bbc', 'radio', 'bonn', 'has', 'led', 'efforts', 'public', 'consumer', 'confidence', 'collapsed', 'in', 'march', 'report', 'suggested', 'humans', 'illness', 'eating', 'contaminated', 
'beef', 'imported', '47,600', 'year', 'nearly', 'half', 'total', 'imports', 'brought', '4,275', 'tonnes', 'mutton', 'some', '10', 'percent', 'overall', 'rare', 'hendrix', 'song', 'draft', 'sells', 'almost', '$', '17,000', 'london', 'handwritten', 'u.s.', 'guitar', 'legend', 'jimi', 'sold', 'auction', 'late', 'musician', 'favourite', 'possessions', 'florida', 'restaurant', 'paid', '10,925', 'pounds', '16,935', 'ai', 'no', 'telling', 'penned', 'piece', 'hotel', 'stationery', '1966', 'end', 'january', '1967', 'concert', 'english', 'city', 'nottingham', 'threw', 'sheet', 'paper', 'into', 'audience', 'where', 'retrieved', 'fan', 'buyers', 'also', 'snapped', 'up', '16', 'items', 'were', 'put', 'former', 'girlfriend', 'kathy', 'etchingham', 'who', 'lived', 'him', '1969', 'they', 'included', 'black', 'lacquer', 'mother', 'pearl', 'inlaid', 'box', 'used', 'store', 'drugs', 'anonymous', 'australian', 'purchaser', 'bought', '5,060', '7,845', 'guitarist', 'died', 'overdose', '1970', 'aged', '27', 'china', 'says', 'taiwan', 'spoils', 'atmosphere', 'talks', 'beijing', 'taipei', 'spoiling', 'resumption', 'strait', 'visit', 'ukraine', 'taiwanese', 'vice', 'president', 'lien', 'chan', 'this', 'week', 'infuriated', 'speaking', 'hours', 'chinese', 'state', 'media', 'time', 'right', 'engage', 'political', 'foreign', 'ministry', 'shen', 'guofang', 'reuters', ':', 'necessary', 'opening', 'disrupted', 'authorities', 'quoted', 'top', 'negotiator', 'tang', 'shubei', 'visiting', 'group', 'rivals', 'hold', 'now', 'two', 'sides', '...', 'hostility', 'overseas', 'edition', 'people', 'daily', 'saying', 'television', 'interview', 'read', 'comments', 'gave', 'details', 'why', 'considered', 'considers', 'renegade', 'province', 'opposed', 'all', 'gain', 'greater', 'international', 'recognition', 'rival', 'island', 'practical', 'steps', 'towards', 'goal', 'consultations', 'held', 'set', 'format', 'official', 'xinhua', 'agency', 'executive', 'association', 'relations', 'straits', 'july', 'car', 
'registrations', '14.2', 'pct', 'yr', '/', 'frankfurt', 'first-time', 'motor', 'vehicles', 'jumped', 'year-earlier', 'period', 'federal', 'office', '356,725', 'new', 'cars', 'registered', '1996', '304,850', 'passenger', '15,613', 'trucks', 'figures', 'represent', '13.6', 'increase', '2.2', 'decline', '1995', 'motor-bike', 'registration', 'rose', '32.7', 'growth', 'partly', 'increased', 'number', 'germans', 'buying', 'abroad', 'while', 'manufacturers', 'domestic', 'demand', 'weak', 'posted', 'gains', 'numbers', 'volkswagen', 'ag', 'won', '77,719', 'slightly', 'more', 'quarter', 'opel', 'together', 'general', 'motors', 'came', 'second', 'place', '49,269', '16.4', 'figure', 'third', 'ford', '35,563', 'or', '11.7', 'seat', 'porsche', 'fewer', 'compared', '3,420', '5522', 'fell', '554', '643', 'greek', 'socialists', 'give', 'green', 'light', 'pm', 'elections', 'athens', 'socialist', 'party', 'bureau', 'prime', 'costas', 'simitis', 'snap', 'its', 'secretary', 'skandalidis', 'reporters', 'announcement', 'cabinet', 'later', 'dimitris', 'kontogiannis', 'newsroom', '+301', '3311812-4', 'bayervb', 'sets', 'c$', '100', 'million', 'six-year', 'bond', 'following', 'announced', 'manager', 'toronto', 'dominion', 'borrower', 'bayerische', 'vereinsbank', 'amt', 'mln', 'coupon', '6.625', 'maturity', '24.sep.02', 'type', 'straight', 'iss', 'price', '100.92', 'pay', 'date', '24.sep.96', 'full', 'fees', '1.875', 'reoffer', '99.32', 'spread', '+20', 'bp', 'moody', 'aa1', 'listing', 'lux', 'freq', '=', 's&p', 'denoms', 'k', '1-10-100', 'sale', 'limits', 'us', 'uk', 'ca', 'neg', 'plg', 'crs', 'deflt', 'force', 'maj', 'gov', 'law', 'home', 'ctry', 'tax', 'provs', 'standard', 'mgt', 'und', '0.275', 'sell', 'conc', '1.60', 'praecip', 'underlying', 'govt', '7.0', 'sept', '2001', 'notes', 'joint', '+44', '171', '542', '7658', 'venantius', '300', '1999', 'frn', 'floating-rate', 'lehman', 'brothers', 'ab', 'swedish', 'mortgage', '-', '12.5', '21.jan.99', 'base', '3m', 'libor', 's23.sep.96', 
'aa3', '99.956', 'aa+', 's', 'short', 'first', 'jp', 'fr', 'yes', 'ipma', '2', 'sweden', '5', 'issued', 'off', 'emtn', 'programme', '8863', 'port', 'update', 'syria', 'lloyds', 'shipping', 'intelligence', 'service', 'lattakia', 'aug', 'waiting', 'tartous', 'presently', '24', 'israel', 'plays', 'down', 'fears', 'war', 'colleen', 'siegel', 'jerusalem', 'outgoing', 'peace', 'current', 'tensions', 'between', 'appeared', 'storm', 'teacup', 'itamar', 'rabinovich', 'ambassador', 'washington', 'conducted', 'unfruitful', 'negotiations', 'looked', 'like', 'damascus', 'wanted', 'talk', 'rather', 'fight', 'appears', 'me', 'syrian', 'priority', 'still', 'negotiate', 'syrians', 'confused', 'definitely', 'tense', 'assessment', 'here', 'essentially', 'winding', 'term', 'will', 'replaced', 'eliahu', 'ben-elissar', 'israeli', 'envoy', 'egypt', 'right-wing', 'likud', 'politician', 'sent', 'message', 'via', 'committed', 'open', 'without', 'preconditions', 'slammed', 'creating', 'called', 'launching', 'hysterical', 'campaign', 'against', 'reported', 'recently', 'test', 'fired', 'missile', 'arms', 'purchases', 'defensive', 'purposes', 'hafez', 'al-', 'assad', 'ready', 'enter', 'david', 'levy', 'tension', 'mounted', 'since', 'benjamin', 'netanyahu', 'took', 'june', 'vowing', 'retain', 'golan', 'heights', 'captured', 'middle', 'east', 'israeli-syrian', 'deadlocked', 'over', '1991', 'despite', 'previous', 'willingness', 'concessions', 'february', 'voices', 'coming', 'out', 'bad', 'not', 'good', 'expressions', 'declarations', 'must', 'worrying', 'artificial', 'very', 'those', 'become', 'prisoners', 'expect', 'face', 'answer', 'our', 'want', 'god', 'forbid', 'one', 'benefits', 'wars', 'channel', 'calming', 'signal', 'source', 'spokesmen', 'confirm', 'messages', 'reassure', 'cairo', 'united', 'states', 'moscow', 'polish', 'diplomat', 'denies', 'nurses', 'stranded', 'libya', 'tunis', 'tabloid', 'refusing', 'exit', 'visas', 'trying', 'return', 'working', 'north', 'african', 'country', 'true', 
'today', 'knowledge', 'nurse', 'kept', 'her', 'received', 'complaint', 'embassy', 'charge', \"d'affaires\", 'tripoli', 'tadeusz', 'awdankiewicz', 'telephone', 'poland', 'labour', 'would', 'send', 'team', 'investigate', 'probe', 'prompted', 'complaining', 'about', 'work', 'non-payment', 'salaries', 'estimated', '800', 'iranian', 'opposition', 'leaders', 'meet', 'baghdad', 'hassan', 'hafidh', 'exile', 'based', 'iraq', 'vowed', 'extend', 'iran', 'kurdish', 'rebels', 'attacked', 'troops', 'deep', 'inside', 'mujahideen', 'khalq', 'statement', 'leader', 'massoud', 'rajavi', 'met', 'secretary-general', 'kurdistan', 'democratic', 'kdpi', 'rastegar', 'voiced', 'rebel', 'kurds', 'emphasised', 'resistance', 'continue', 'stand', 'side', 'compatriots', 'movement', 'signals', 'level', 'cooperation', 'oppositions', 'heavily', 'bombarded', 'targets', 'northern', 'pursuit', 'guerrillas', 'iraqi', 'areas', 'outside', 'control', 'bordering', 'patriotic', 'puk', 'kdp', 'main', 'factions', 'forces', 'ousted', 'kuwait', 'gulf', 'clashes', 'parties', 'broke', 'weekend', 'most', 'serious', 'fighting', 'u.s.-sponsored', 'ceasefire', 'shelling', 'positions', 'qasri', 'region', 'suleimaniya', 'near', 'border', 'days', 'killed', 'wounded', 'attack', 'both', 'turkey', 'mount', 'air', 'land', 'strikes', 'own', 'u.s.-led', 'southern', 'protects', 'possible', 'attacks', 'saudi', 'riyal', 'rates', 'steady', 'quiet', 'summer', 'trade', 'manama', 'spot', 'dollar', 'interbank', 'deposit', 'mainly', 'dealers', 'kingdom', 'changes', 'market', 'holidays', 'dealer', '3.7504', '06', 'one-month', 'deposits', '5-1/2', '3/8', 'three', 'months', '5-5/8', '1/2', 'six', '5-3/4', '5/8', 'one-year', 'funds', '5-7/8', 'approves', 'arafat', 'flight', 'west', 'bank', 'palestinian', 'yasser', 'permission', 'fly', 'territory', 'ending', 'brief', 'israeli-plo', 'crisis', 'adviser', 'problem', 'aircraft', 'pass', 'airspace', 'expected', 'travel', 'before', 'monday', 'nabil', 'abu', 'rdainah', 'scheduled', 'shimon', 
'peres', 'town', 'ramallah', 'venue', 'changed', 'gaza', 'clearance', 'helicopters', 'stop', 'keeping', 'grounded', 'subsequently', 'cancelled', 'plo', 'civilian', 'affairs', 'allenby', 'bridge', 'crossing', 'jordan', 'decided', 'flying', 'lifted', 'busy', 'schedule', 'free', 'palestinians', 'barred', 'erez', 'checkpoint', 'planned', 'overflying', 'helicopter', 'attempt', 'bar', 'defeated', 'may', 'undermine', 'authority', 'conduct', 'afghan', 'uae', 'taleban', 'guards', 'hilary', 'gush', 'dubai', 'arab', 'emirates', 'russian', 'hostages', 'escaped', 'militia', 'afghanistan', 'few', 'dhabi', 'touch', 'issuing', 'them', 'documents', 'homeland', 'objection', 'added', 'islamic', 'overpowered', 'seven', 'aircrew', 'sharjah', 'friday', 'board', 'captivity', 'kandahar', 'hand', 'red', 'crescent', 'possibly', 'tuesday', 'silent', 'when', 'asked', 'back', 'capital', 'kabul', 'headquarters', 'controlled', 'burhanuddin', 'rabbani', 'overthrow', 'men', '20s', 'currently', 'did', 'elaborate', 'russians', 'aerostan', 'firm', 'republic', 'tatarstan', 'hostage', 'mig-19', 'fighter', 'forced', 'cargo', 'plane', 'august', 'shipment', 'ammunition', 'albania', 'evidence', 'military', 'crew', 'nationality', 'coincidental', 'numerous', 'diplomatic', 'attempts', 'failed', 'armed', 'kalashnikov', 'automatic', 'rifles', 'doing', 'regular', 'maintenance', 'ilyushin', '76', 'left', 'sunday', 'saddam', 'meets', 'russia', 'zhirinovsky', 'hussein', 'ultra-nationalist', 'vladimir', 'maintain', 'friendship', 'newspapers', 'stressed', 'during', 'keenness', 'papers', 'liberal', 'duma', 'parliament', 'calling', 'immediate', 'lifting', 'embargo', 'imposed', '1990', 'invasion', 'press', 'help', 'u.n.', 'sanctions', 'blamed', 'delaying', 'establishment', 'ties', 'namely', 'economic', 'resume', 'visited', 'twice', 'october', 'invited', 'attend', 'referendum', 'presidency', 'extended', 'years', 'digest', '22', 'these', 'leading', 'stories', 'verified', 'does', 'vouch', 'accuracy', 'thawra', 'turkish', 
'part', 'fair', 'november', 'shipload', '12', 'rice', 'arrives', 'umm', 'qasr', 'lebanon', 'beirut', 'an-nahar', 'confrontation', 'escalating', 'hizbollah', 'hariri', 'threats', 'serve', 'as-safir', 'speaker', 'berri', 'preparing', 'parliamentary', 'battle', '..', 'lists', 'prepared', 'al-anwar', 'continued', 'criticism', 'violation', 'incidents', 'occurred', 'ad-diyar', 'financial', 'pakistan', 'step', 'election', 'incomplete', 'list', \"nida'a\", 'al-watan', 'maronite', 'patriarch', 'sfeir', 'sorrow', 'violations', 'cme', 'live', 'feeder', 'calls', 'range', 'mixed', 'chicago', 'futures', 'ranged', '0.200', 'cent', 'higher', '0.100', 'lower', 'livestock', 'analysts', 'strong', 'tone', 'cash', 'markets', 'prompt', 'outlook', 'bullish', 'cattle-on-feed', 'lend', 'bull', 'spreading', 'however', 'likely', 'prices', 'drift', 'evening', 'ahead', 'record', 'amount', 'feedlot', 'traded', 'kindercare', 'debt', 'hit', 'q1', 'results', 'montgomery', 'ala', 'learning', 'centers', 'inc', 'buyback', 'mean', 'extraordinary', 'loss', '1.2', 'fiscal', '1997', 'company', 'began', '1', '30', 'par', 'value', 'outstanding', '10-3/8', '31.5', 'philip', 'maslowe', 'officer', 'preschool', 'child', 'care', 'offered', 'opportunity', 'reduce', 'weighted', 'average', 'interest', 'costs', 'improve', 'future', 'flows', 'earnings', 'research', 'alert', 'starts', 'snet', 'analyst', 'blake', 'bath', 'started', 'england', 'telecommunciations', 'corp', 'outperform', 'rating', '12-month', 'target', '45', 'estimate', '3.09', 'per', 'share', 'immediately', 'available', 'closed', '38-1/2', 'e.', 'auchard', 'wall', 'street', '212-859-1736', 'gateway', 'data', 'sciences', 'q2', 'net', 'rises', 'phoenix', 'summary', 'consolidated', 'thousands', 'except', 'ended', 'jul', '31', 'income', 'revenue', '10,756', '13,102', '7,961', '5,507', 'software', '2,383', '1,558', '1,086', '1,074', 'services', '1,154', '692', '624', '465', 'operating', '906', '962', '599', '515', '821', '512', '565', '301', '0.31', '0.34', 
'0.19', '0.20', 'jan', 'balance', '5,755', '881', 'equivalents', '2,386', '93', 'assets', '14,196', '7,138', 'shareholders', 'equity', '5,951', '1,461', 'backing', 'chooses', 'le', 'monde', 'paris', 'afternoon', 'dated', '23', 'front', 'page', 'africans', 'seeking', 'renew', 'obtain', 'residence', 'rights', 'say', 'alain', 'juppe', 'proposals', 'insufficient', 'hunger', 'strike', 'enters', '49th', 'day', 'church', 'rally', 'attracts', '8,000', 'sympathisers', 'flnc', 'corsican', 'nationalist', 'announces', 'truce', 'night', 'business', 'pages', 'shutdown', 'bally', 'french', 'factories', 'points', 'shoe', 'industry', 'undercut', 'low-wage', 'competition', 'failure', 'keep', 'abreast', 'trends', 'sud-ptt', 'telecom', 'elements', 'social', 'unrest', 'weeks', '+33', '42', '21', '53', '81', 'well', 'repairs', 'lift', 'heidrun', 'oil', 'output', 'statoil', 'oslo', 'plugged', 'water', 'injection', 'wells', 'oilfield', 'mid-norway', 'reopened', 'operator', 'den', 'norske', 'stats', 'oljeselskap', 'accounted', 'dip', '30,000', 'barrels', 'bpd', 'roughly', '220,000', 'according', 'status', 'weekly', 'newsletter', 'reperforated', 'gravel', 'pumped', 'reservoir', 'plugging', 'problems', '+47', '50', '41', 'finnish', 'april', 'surplus', '3.8', 'billion', 'markka', 'ncb', 'helsinki', 'finland', '3.83', '3.43', 'customs', 'exports', 'year-on-year', '96', 'jan-april', '95', '10,663', '10,725', '43,430', '40,989', '14,494', '14,153', '56,126', '56,261', '+3,831', '+3,428', '+12,696', '+15,272', 'january-april', 'import', 'revised', '39,584', 'export', '55,627', '3.2', 'projected', '14.5', '11.3', 'monthly', 'statistics', 'lagging', 'behind', 'procedures', 'joined', 'start', '+358', '0', '680', '245', 'dutch', 'raises', 'tap', '99.95', 'amsterdam', 'finance', 'raised', 'sales', '5.75', 'september', '2002', '99.90', 'being', '07.00', 'gmt', '15.00', 'notice', '2.3', 'guilders', 'close', '+31', '20', '504', '5000', 'tells', 'agriculture', 'meat', 'animals', 'cleared', 'panels', 
'done', 'quickly', 'preference', 'zdf', 'i', 'concrete', 'too', 'many', 'holes', 'know', 'filled', 'ensure', 'protection', 'tops', 'priorities', 'dealing', 'erupted', 'acknowledged', 'rethink', 'use', 'suspect', 'tissue', 'experts', 'banning', 'members', 'given', 'question', 'studied', 'separately', 'perfectly', 'safe', 'eat', 'admitted', 'link', 'fatal', 'equivalent', 'worldwide', 'summit', 'progressive', 'takes', 'parallel', 'eradicate', 'golf', 'scores', 'world', 'series', 'akron', 'ohio', '2.1', 'nec', 'round', '7,149', 'yard', '70', 'firestone', 'c.c', 'course', 'players', 'unless', 'stated', '66', 'paul', 'goydos', 'billy', 'mayfair', 'hidemichi', 'tanaka', 'japan', '68', 'steve', 'stricker', '69', 'justin', 'leonard', 'mark', 'brooks', 'tim', 'herron', 'duffy', 'waldorf', 'davis', 'love', 'anders', 'forsbrand', 'nick', 'faldo', 'cook', 'phil', 'mickelson', 'greg', 'norman', 'australia', '71', 'ernie', 'els', 'south', 'africa', 'scott', 'hoch', '72', 'clarence', 'loren', 'roberts', 'fred', 'funk', 'sven', 'struver', 'alexander', 'cejka', 'hal', 'sutton', 'tom', '73', 'd.a.', 'weibring', 'brad', 'bryant', 'craig', 'parry', 'stewart', 'ginn', 'corey', 'pavin', 'stadler', \"o'meara\", 'couples', '74', 'stankowski', 'costantino', 'rocca', 'italy', '75', 'jim', 'furyk', 'satoshi', 'higashi', 'willie', 'wood', 'shigeki', 'maruyama', 'mccarron', '77', 'wayne', 'westner', 'schneiter', '79', 'watson', 'seiki', 'okuda', 'soccer', 'gloria', 'bistrita', 'beat', '2-1', 'f.c.', 'valletta', 'romania', 'halftime', '1-1', 'malta', 'cup', 'winners', 'match', 'leg', 'preliminary', 'scorers', 'ilie', 'lazar', '32nd', 'eugen', 'voica', '84th', 'la', 'gilbert', 'agius', '24th', 'attendance', '4-2', 'aggregate', 'qualified', 'reuter', 'horse', 'racing', 'pivotal', 'ends', '25-year', 'wait', 'trainer', 'prescott', 'york', 'sir', 'landed', 'victory', '25', 'sprinter', '100-30', 'chance', 'nunthorpe', 'stakes', 'three-year-old', 'partnered', 'veteran', 'george', 'duffield', 
'snatched', 'head', 'verdict', 'stride', 'deny', 'eveningperformance', '16-1', 'trained', 'henry', 'candy', 'ridden', 'chris', 'rutter', 'hever', '11-4', 'prix', 'l', 'abbaye', 'winner', 'longchamp', 'finished', 'lengths', 'away', '7-4', 'mind', 'games', 'fourth', 'royal', 'ascot', 'aimed', 'season', 'sprint', 'race', 'reluctant', 'go', 'enclosure', 'result', 'photo-finish', 'twenty-five', 'never', 'so', 'thought', 'better', 'bit', 'longer', 'sad', 'am', 'godfather', 'daughter', 'jack', 'berry', 'gone', 'search', 'success', 'around', 'profession', 'i`m', 'disappointed', 'feel', 'suicidal', 'furlongs', 'metres', 'just', 'quicken', 'two-year-olds', 'upwards', 'run', 'five', 'km', '1.', '2.', '3.', 'jason', 'weaver', 'eight', 'ran', '4th', 'distances', '1-1/4', 'owned', 'cheveley', 'park', 'stud', 'newmarket', '72,464', 'sterling', '112,200', 'tennis', 'toshiba', 'classic', 'carlsbad', 'california', '1996-08-21', '450,000', 'tournament', 'prefix', 'denotes', 'seeding', 'arantxa', 'sanchez', 'vicario', 'spain', 'naoko', 'kijimuta', '1-6', '6-4', '6-3', '4', 'kimiko', 'yone', 'kamio', '6-2', '7-5', 'sandrine', 'testud', '7', 'sugiyama', '4-6', '8', 'nathalie', 'tauziat', 'shi-ting', 'wang', 'hamlet', 'commack', 'waldbaum', 'michael', 'chang', 'sergi', 'bruguera', 'joyce', '3', 'richey', 'reneberg', '3-6', 'martin', 'damm', 'czech', '6', 'younes', 'el', 'aynaoui', 'morocco', '5-7', '3-0', 'retired', 'karol', 'kucera', 'slovakia', 'hicham', 'arazi', '7-6', 'dalglish', 'parting', 'kenny', 'spoke', 'sadness', 'leaving', 'club', 'premier', 'league', 'title', '1994-95', 'parted', 'mutual', 'consent', 'ex-manager', 'confessed', 'taking', 'division', 'local', 'newspaper', 'holiday', 'same', 'opinion', 'albeit', 'little', 'opened', 'my', 'mouth', 'stayed', 'way', 'let', 'get', 'job', 'conclusion', 'then', 'past', '15', 'director', 'football', 'cricket', 'county', 'championship', 'play', 'four-day', 'matches', 'weston-super-mare', 'durham', '326', 'd.', 'cox', 's.', 'campbell', 
';', 'g.', '7-73', 'somerset', '236-4', 'm.', 'lathwell', '85', 'firsy', 'colchester', 'gloucestershire', '280', 'j.', 'russell', '63', 'a.', 'symonds', '52', 'cowan', '5-68', 'essex', '72-0', 'cardiff', 'kent', '128-1', 'walker', '59', 'fulton', 'v', 'glamorgan', 'leicester', 'leicestershire', '343-8', 'p.', 'simmons', '108', 'nixon', '67', 'hampshire', 'northampton', 'sussex', '368-7', 'n.', 'lenham', '145', 'v.', 'drakes', '51', 'northamptonshire', 'trent', 'nottinghamshire', '392-6', 'archer', '143', 'dowman', '107', 'surrey', 'worcester', 'warwickshire', '255-9', 'giles', '57', 'w.', 'khan', 'worcestershire', 'headingley', 'yorkshire', '305-5', 'c.', 'white', 'moxon', 'vaughan', 'lancashire', 'final', 'scoreboard', 'oval', 'innings', 'atherton', 'b', 'waqar', 'younis', 'mushtaq', 'ahmed', '44', 'hussain', 'c', 'saeed', 'anwar', 'thorpe', 'lbw', 'mohammad', 'akram', '54', 'crawley', '94', 'knight', '17', 'lewis', 'wasim', 'i.', 'salisbury', 'extras', 'lb-11', 'w-1', 'nb-8', 'wickets', '278', 'fall', '1-64', '2-85', '3-116', '4-205', '5-248', '6-273', 'bat', 'r.', 'croft', 'cork', 'mullally', 'bowling', '25-8-61-1', '20-6-70-2', '12-1-41-1', '27-5-78-2', 'aamir', 'sohail', '6-1-17-0', 'ijaz', 'inzamam-ul-haq', 'salim', 'malik', 'asif', 'mujtaba', 'moin', 'akam', 'ferguson', 'scottish', 'squad', 'glasgow', 'everton', 'duncan', 'scored', 'manchester', 'picked', '20-month', 'rangers', 'striker', 'ally', 'mccoist', 'another', 'man', 'form', 'hat-tricks', 'four', 'named', 'qualifier', 'austria', 'vienna', 'served', 'jail', 'head-butting', 'opponent', 'scotland', 'caps', 'december', '1994', 'brown', \"'ve\", 'watched', 'bang', 'great', 'scoring', 'moment', 'celtic', 'jackie', 'mcnamara', 'successful', 'under-21', 'earns', 'call-up', '100-2', 'lunch', 'keane', 'signs', 'four-year', 'ireland', 'midfielder', 'roy', 'signed', 'f.a.', 'champions', 'deal', 'game', 'delighted', 'alex', 'canadian', 'daniel', 'nestor', 'canada', 'thomas', 'muster', 'mikael', 'tillstrom', 
'goran', 'ivanisevic', 'croatia', '6-7', '3-7', 'ferreira', 'jiri', 'novak', 'marcelo', 'rios', 'chile', 'kenneth', 'carlsen', 'denmark', 'malivai', 'corretja', 'todd', 'renzo', 'furlan', '7-3', 'philippoussis', 'marc', 'rosset', 'switzerland', '8-6', '9', 'cedric', 'pioline', 'gregory', 'carraz', '7-1', 'patrick', 'rafter', '11', 'alberto', 'berasategui', '6-1', 'petr', 'korda', 'francisco', 'clavet', 'vacek', '13', 'stoltenberg', '13-11', 'woodbridge', 'sebastien', 'lareau', \"o'brien\", 'byron', 'zimbabwe', '7-2', 'bohdan', 'ulihrach', 'andrea', 'gaudenzi', 'henman', 'woodruff', 'walkover', 'millns', 'boland', 'cape', 'provincial', 'fast', 'bowler', 'toured', '1992/93', 'replaces', 'all-rounder', 'phillip', 'defreitas', 'professional', 'tirana', 'qualifying', 'flamurtari', 'vlore', 'chemlon', 'humenne', '0-0', 'lubarskij', '50th', 'minute', 'valkucak', '54th', '5,000', 'win', 'chorzow', 'ruch', 'llansantffraid', 'wales', '1-0', 'arkadiusz', 'bak', '1st', '55th', 'arwel', '47th', 'miroslav', '62nd', '63rd', '6,500', 'larnaca', 'aek', 'cyprus', 'kotaik', 'abovyan', 'armenia', '2-0', 'zoran', 'kundic', '28th', 'klimis', 'alexandrou', '41st', 'milenko', 'kovasevic', '60th', 'penalty', 'koprinovic', '82nd', 'pavlos', 'markou', '5-1', 'siauliai', 'kareda', 'lithuania', 'sion', 'agrregate', 'vinnytsya', 'nyva', 'tallinna', 'sadam', 'estonia', '3,000', 'score', '2-2', 'goals', 'rule', 'bergen', 'brann', 'norway', 'shelbourne', 'mons', 'ivar', 'mjelde', '10th', 'ove', 'pedersen', '72nd', 'rutherford', '5th', '2,189', '5-2', 'sofia', 'levski', 'bulgaria', 'olimpija', 'slovenia', 'scorer', 'ilian', 'simeonov', '58th', '25,000', '4-3', 'penalties', 'vaduz', 'liechtenstein', 'raf', 'riga', 'latvia', 'daniele', 'polverino', '90th', 'agrins', 'zarins', 'luxembourg', 'varteks', 'varazdin', 'drazen', 'beser', 'miljenko', 'mumler', '78th', 'jamir', 'cvetko', '87th', 'torshavn', 'havnar', 'boltfelag', 'faroe', 'islands', 'dynamo', 'batumi', 'georgia', '0-2', '9-0', 'prague', 
'sparta', 'glentoran', '4-0', 'gunda', '26th', 'lumir', 'mistr', '19th', 'horst', 'siegl', '48th', '80th', 'zdenek', 'svoboda', '76th', 'gabriel', '86th', '10-1', 'edinburgh', 'hearts', 'star', 'belgrade', 'yugoslavia', 'dave', 'mcpherson', '44th', 'vinko', 'marinovic', '59th', '15,062', 'rishon-lezion', 'hapoel', 'ironi', 'constructorul', 'chisinau', 'moldova', '3-3', 'anjalonkoski', 'mypa-47', 'karabach', 'agdam', 'azerbaijan', 'skopje', 'sloga', 'jugomagnat', 'macedonia', 'kispest', 'honved', 'hungary', 'add', 'rishon', 'moshe', 'sabag', 'nissan', 'kapeta', 'tomas', 'cibola', 'constructorol', 'sergei', 'rogachev', '42nd', 'gennadi', 'skidan', '1,500', 'gothenburg', 'ferencvaros', 'euro', 'budapest', 'ifk', 'drew', 'tie', 'played', '4-1', 'ferenc', 'horvath', '15th', 'andreas', 'andersson', '9,000', 'brazilian', 'rio', 'janeiro', 'midweek', 'bahia', 'atletico', 'paranaense', 'corinthians', 'guarani', 'coritiba', 'mineiro', 'cruzeiro', 'vitoria', 'flamengo', 'juventude', 'goias', 'sport', 'recife', 'gremio', 'bragantino', 'palmeiras', 'vasco', 'da', 'gama', 'portuguesa', 'parana', 'newcombe', 'ponders', 'sydney', 'captain', 'signalled', 'resignation', 'loses', 'wimbledon', 'champion', 'coach', 'tony', 'roche', 'determined', 'events', 'split', 'lose', 'look', 'giving', 'someone', 'else', 'telegraph', 'clay', '20-22', 'leadership', 'relegated', 'elite', '26-time', 'slipped', 'rank', 'neale', 'fraser', 'tandem', 'doubles', 'partner', 'wins', 'losses', 'selected', 'semifinalist', 'olympic', 'woodforde', 'croatians', 'boasts', 'conceded', 'hard-pressed', 'croatian', 'breath', 'absolute', 'best', 'described', 'toughest', 'faced', '1986', 'beaten', 'finalists', 'ago', 'guidance', 'badminton', 'malaysian', 'kuala', 'lumpur', 'singles', '9/16', 'luo', 'yigang', 'hwang', 'sun-ho', 'korea', '15-3', '15-7', 'wong', 'malaysia', 'abdul', 'samad', 'ismail', '16-18', '15-2', '17-14', 'kantharoopan', '3/4', 'jeroen', 'dijk', 'netherlands', '15-11', '18-14', 'wijaya', 'indra', 
'indonesia', 'pang', 'chen', '15-6', '6-15', 'hu', 'zhilan', 'nunung', 'subandoro', '5-15', '18-15', 'hermawan', 'susanto', 'fung', 'permadi', '15-8', '15-12', 'women', '2nd', 'cindana', '11-3', '1ama', 'margit', 'borg', '11-6', 'sun', 'jian', 'marina', 'andrievskaqya', '11-8', '11-2', 'meluawati', 'chia', 'fong', '11-1', 'gong', 'zhichao', 'liu', 'lufung', '6-11', '11-7', 'zeng', 'yaqiong', 'li', 'feng', 'zealand', '11-9', 'christine', 'magnusson', 'ishwari', 'boopathy', '10-12', 'zhang', 'ning', 'olivia', 'draw', 'championships', 'beginning', 'u.s', 'centre', 'pete', 'sampras', 'vs.', 'adrian', 'voinea', 'magnus', 'larsson', 'volkov', 'vs', 'andrei', 'olhovskiy', 'roberto', 'carretero', 'jordi', 'burillo', '------------------------', 'jonas', 'bjorkman', 'christian', 'rudd', 'rikl', 'sjeng', 'schalken', 'schaller', 'grant', 'stafford', 'guy', 'forget', 'fernando', 'meligeni', 'brazil', 'yevgeny', 'kafelnikov', 'chesnokov', 'draper', 'galo', 'blanco', 'johansson', 'hendrik', 'dreekman', 'rusedski', 'medvedev', 'jean-philippe', 'fleurian', 'kroslak', '14', 'costa', 'younnes', 'shuzo', 'matsuoka', 'doug', 'flach', 'mats', 'wilander', 'haarhuis', 'tebbutt', 'jonathan', 'stark', 'bernd', 'karbacher', 'stefan', 'edberg', 'richard', 'krajicek', 'andre', 'agassi', 'mauricio', 'hadad', 'colombia', 'marcos', 'ondruska', 'felix', 'mantilla', 'carlos', 'moya', 'humphries', 'siemerink', 'carl-uwe', 'steeb', 'wheaton', 'kevin', 'kim', 'nicolas', 'lapentti', 'ecuador', 'karim', 'alami', 'enqvist', 'stephane', 'simian', 'guillaume', 'raoux', 'filip', 'dewulf', 'belgium', 'knowles', 'bahamas', 'filippini', 'uruguay', 'kris', 'goossens', 'stich', 'chuck', 'adams', 'javier', 'frana', 'argentina', 'courier', 'grabb', 'sandon', 'stolle', 'stefano', 'pescosolido', 'arnaud', 'boetsch', 'pereira', 'venezuela', 'gustafsson', 'jeff', 'tarango', 'radulescu', 'jared', 'palmer', 'hernan', 'gumy', 'nicklas', 'kulti', 'jakob', 'hlasek', 'cecil', 'mamiit', 'vince', 'spadea', 'prinosil', 
'carbonell', 'baseball', 'orioles', 'davey', 'johnson', 'hospitalized', 'baltimore', 'miss', 'seattle', 'mariners', 'hospital', 'irregular', 'heartbeat', '53-year-old', 'experiencing', 'dizziness', 'treated', 'observed', 'physician', 'dr.', 'william', 'goldiner', 'adding', 'released', 'bench', 'andy', 'etchebarren', 'manage', 'absence', 'angels', 'skipper', 'columbia', 'presbyterian', 'blood', 'clot', 'calf', 'seasons', 'off-season', 'replacing', 'regan', 'cincinnati', 'reds', 'guided', 'mets', 'pull', 'within', 'slumping', 'yankees', 'american', 'major', 'standings', 'tabulate', 'lost', 'winning', 'percentage', 'eastern', 'w', 'gb', '.576', '58', '.536', 'boston', '64', '.496', '.457', 'detroit', '82', '.349', '28', 'central', 'cleveland', '.598', '.539', 'minnesota', '.500', 'milwaukee', '60', '.469', 'kansas', '.453', '18', 'western', 'texas', '.575', '61', '.512', 'oakland', '62', '.481', '.460', 'atlanta', '46', '.632', 'montreal', '.461', 'philadelphia', '.409', 'houston', '.535', 'st', 'louis', '.532', '.504', 'pittsburgh', '.421', 'san', 'diego', '.543', 'los', 'angeles', '.524', 'colorado', '65', '.435', 'greer', 'homer', 'lifts', 'indians', 'rusty', 'two-run', 'inning', 'rallied', '10-8', 'rubber', 'three-game', 'pitch', 'julian', 'tavarez', '4-7', 'right-field', 'fence', 'off-speed', 'tried', 'swing', 'big', 'crowd', 'intense', 'shot', 'ivan', 'rodriguez', 'double', 'catcher', 'mickey', 'cochrane', 'johnny', 'terry', 'kennedy', 'catchers', '40', 'nine', 'meetings', 'jacobs', 'field', 'joining', 'teams', 'a.l.', 'extra', 'ninth', 'lofton', 'single', 'ed', 'vosberg', 'blew', 'save', 'got', 'allowing', 'hits', 'walks', 'strikeouts', '2/3', 'scoreless', 'dean', '30th', 'cal', 'ripken', 'fifth-inning', 'solo', 'bobby', 'bonilla', 'three-run', 'seventh', 'power', 'surging', '10-5', 'runs', 'fifth', '5-5', 'bottom', '21st', 'starter', 'hitchcock', '12-6', 'blast', 'randy', 'cy', 'young', 'allowed', 'relief', 'appearances', 'disabled', 'rbi', 'cut', 'erickson', 
'8-10', 'laboured', 'homers', 'dropped', 'row', 'became', 'shortstop', 'major-league', 'history', '34', 'hoiles', '22nd', 'dickson', 'scattered', '1/3', 'debut', 'chili', 'belted', 'each', 'plate', 'derek', 'jeter', 'settled', '27th', 'pitcher', 'tying', 'jimmy', 'key', '9-10', 'baserunners', 'interim', 'mike', 'stanley', 'bases-loaded', 'eighth-inning', 'sox', 'athletics', 'owns', '.367', 'career', 'batting', 'bases', 'loaded', '33-for-90', 'mo', 'vaughn', 'went', '3-for-3', 'walk', 'stole', 'collected', '116th', 'brosius', 'homered', 'drove', 'ausmus', 'capped', 'four-run', 'eighth', 'tigers', 'reeling', 'consecutive', 'dropping', 'juan', 'guzman', 'tossed', 'complete-game', 'six-hitter', 'league-best', 'era', 'blue', 'jays', 'royals', 'span', 'earned', 'lowered', '2.99', 'jaha', 'five-run', 'brewers', '10-7', 'twins', 'jose', 'valentin', 'cocu', 'psv', 'spur', 'eindhoven', 'nijmegen', 'bicycle', 'kick', 'minutes', 'arthur', 'numan', 'luc', 'nilis', 'marksmen', 'ajax', 'defence', 'nac', 'breda', 'eykeren', '11th', '67th', '1-2', 'sharpshooter', 'knup', 'swiss', 'geneva', 'galatasaray', '26', 'internationals', 'recalled', 'baku', 'overlooked', 'artur', 'jorge', 'finals', 'rolf', 'fringer', 'clearly', '19-man', 'progress', 'beyond', 'phase', 'goalkeepers', 'marco', 'pascolo', 'cagliari', 'pascal', 'zuberbuehler', 'grasshoppers', 'defenders', 'henchoz', 'hamburg', 'hottiger', 'yvan', 'quentin', 'ramon', 'vega', 'raphael', 'wicky', 'midfielders', 'alexandre', 'comisetti', 'antonio', 'esposito', 'fournier', 'stuttgart', 'christophe', 'ohrel', 'lausanne', 'sylvestre', 'sesa', 'servette', 'ciriaco', 'sforza', 'inter', 'milan', 'murat', 'yakin', 'strikers', 'kubilay', 'turkyilmaz', 'bonvin', 'chapuisat', 'borussia', 'dortmund', '40,000', 'beers', 'house', 'spectators', 'grand', 'incentive', 'cheer', 'athletes', 'performances', 'glass', 'beer', 'belgian', 'brewery', 'drinks', 'goes', 'organisers', 'expensive', 'rounds', 'ever', 'already', 'records', 'broken', '1,000', 
'broadhurst', 'raymond', 'ian', 'woosnam', 'bernhard', 'langer', 'ronan', 'rafferty', 'lanner', 'riley', 'eamonn', 'darcy', 'nyman', 'claydon', 'roe', 'retief', 'goosen', 'carl', 'suneson', 'stephen', 'lawrie', 'pyman', 'max', 'anglert', 'miles', 'tunnicliff', 'cevaer', 'des', 'smyth', 'carter', 'lee', 'westwood', 'chalmers', 'miguel', 'angel', 'bjorn', 'roca', 'derrick', 'cooper', 'hawksworth', 'padraig', 'harrington', 'welch', 'gogele', 'mcginley', 'gary', 'orr', 'jose-maria', 'canizares', 'jonzon', 'eales', 'williams', 'andrew', 'coltart', 'lomas', 'rivero', 'robert', 'karlsson', 'marcus', 'wills', 'pedro', 'linhart', 'jamie', 'spence', 'pinero', 'mouland', 'uefa', 'rewards', 'rewarded', 'additional', '1997-98', 'headed', 'rankings', '1995-96', '8.62', '8.61', '8.57', 'formula', 'account', 'factors', 'including', 'yellow', 'cards', 'coaching', 'behaviour', 'clubs', 'allocated', 'places', '4.', '8.56', '5.', '8.54', '6.', '8.52', '7.', '8.45', '8.', 'belarus', '8.39', '9.', 'iceland', '8.35', '10.', '8.30', '13.', '8.29', '15.', '8.24', '16.', '8.22', '18.', '8.20', '19.', '8.18', '20.', '8.17', '21.', '8.15', '23.', '8.12', 'portugal', '25.', '8.10', '26.', '8.09', '29.', '8.07', '30.', '8.06', '31.', '8.05', '32.', '8.03', '33.', '8.02', '35.', '7.98', '36.', '7.95', '37.', 'greece', '7.89', '39.', '7.85', '40.', '7.83', '41.', '7.80', '42.', '7.77', '43.', '7.75', '44.', '7.73', '45.', '7.40', 'police', 'commandos', 'australians', 'colombo', 'patrolled', 'ground', 'tour', 'sri', 'lanka', 'youth', 'limited', 'overs', 'includes', 'india', 'promised', 'presence', 'sniffer', 'dogs', 'plainclothes', 'policemen', 'trouble-free', 'making', 'boycotting', 'fixture', 'ethnic', 'violence', 'warm-up', '251', 'ricky', 'ponting', '119', 'balls', 'sixes', 'fours', 'retiring', 'replied', '246', 'geoff', 'marsh', 'impressed', 'competitiveness', 'made', 'sweat', 'romanian', 'dies', 'bus', 'crash', 'others', 'injured', 'romanian-registered', 'collided', 'bulgarian', 'buses', 
\"o'clock\", 'morning', 'road', 'towns', 'rousse', 'veliko', 'tarnovo', 'woman', 'maria', '35', 'accident', 'investigated', '359-2-84561', 'journal', 'contents', 'oj', '211', '*', 'note', 'displayed', 'reverse', 'order', 'printed', 'corrigendum', 'regulation', 'ec', '1464/96', 'relating', 'invitation', 'tender', 'levies', 'refunds', 'sugar', '187', '26.7.1996', '658/96', 'certain', 'granting', 'compensatory', 'payments', 'system', 'producers', 'arable', 'crops', '91', '12.4.1996', '1663/96', 'establishing', 'values', 'determining', 'entry', 'fruit', 'vegetables', 'document', 'appeal', 'payment', 'denial', 'minnetonka', 'minn', 'district', 'court', 'minneapolis', 'decision', 'financing', 'administration', 'hcfa', 'reimbursement', 'medicaid', 'administrator', 'reversed', 'previously', 'favorable', 'regarding', 'related', 'community', 'liaison', 'personnel', 'continues', 'believe', 'majority', 'coverable', 'terms', 'medicare', 'program', 'optimistic', 'ultimate', 'resolution', 'gildea', 'recorded', 'reserve', 'equal', 'ruled', 'favor', 'expenses', '81,000', 'disputed', 'distrct', 'dispute', 'pleased', 'recognize', 'significant', 'toward', 'disputes', 'newsdesk', '312-408-8787', 'oppenheimer', 'oct.', 'div', 'lp', 'distribution', 'rate', 'quarterly', 'assuming', 'improved', 'declared', '0.65', 'partnership', 'unit', 'sees', 'richmond', 'va', 'products', 'co', 'second-quarter', '34.6', 'retailer', 'annual', 'even', 'bankruptcy', 'consideration', 'emerged', 'chapter', '3-1/2', 'always', 'particularly', 'you', 'something', 'striving', 'richmond-based', '95.7', 'second-largest', 'stores', 'closing', 'lease', 'agreements', 'plan', 'operates', '169', '29', '7.1', '0.23', '311.9', 'measles', 'exposure', 'bowel', '1996-08-23', 'pregnant', 'babies', 'crohn', 'debilitating', 'disorder', 'researchers', 'born', 'mothers', 'caught', 'developed', 'cases', 'dr', 'wakefield', 'school', 'medicine', 'colleagues', 'screened', 'delivered', 'university', 'uppsala', '1940', '1949', 
'children', 'wrote', 'lancet', 'medical', 'inflammation', 'sometimes', 'require', 'surgery', 'causes', 'diarrhoea', 'abdominal', 'pain', 'weight', 'involved', 'especially', 'severe', 'viruses', 'often', 'cause', 'birth', 'defects', 'notably', 'rubella', 'high', 'stillborn', 'baby', 'cbi', 'industrial', 'survey', 'manufacturing', 'confederation', 'enquiry', 'book', 'stocks', 'goods', '+17', '+19', '+25', 'expectations', '+22', '+12', '+16', '+6', '+4', 'replying', 'above', 'normal', 'below', '1,305', 'companies', 'representing', 'industries', 'accounting', 'manufactured', 'employees', 'rosemary', 'bennett', '7715', 'shipsales', 'secondhand', 'tonnage', 'brokers', 'vessels', 'iron', 'gippsland', 'built', '1989', '87,241', 'dwt', 'sairyu', 'maru', '1982', '60,960', '15.5', 'stainless', '21,718', 'subject', 'inspection', 'garlic', 'pills', 'cholesterol', 'finds', 'studies', 'show', 'flawed', 'doctors', 'oxford', 'benefit', 'significantly', 'tablets', '115', 'levels', '900', 'milligrams', 'dried', 'powder', 'placebo', 'differences', 'groups', 'receiving', 'college', 'physicians', 'low-fat', 'diet', 'measured', 'six-week', 'findings', 'accurate', 'several', 'pressure', 'either', 'trials', 'interpreted', 'incorrectly', 'special', 'diets', 'beforehand', 'duration', 'six-month', 'trial', 'funded', 'heart', 'foundation', 'lichtwer', 'pharma', 'gmbh', 'makes', 'kwai', 'brand', 'address', 'whole', 'affect', '7950', 'gives', 'aid', 'volcano-hit', 'caribbean', '39', 'development', 'montserrat', 'much', 'population', 'living', 'fled', 'volcano', 'soufriere', 'hills', 'times', '4,500', 'plymouth', 'evacuated', 'shelters', 'schools', 'assistance', 'provide', 'track', 'designated', 'area', '8.5', 'dependent', 'territories', 'active', 'lynda', 'chalker', 'recent', 'census', 'shown', 'montserratians', 'remain', 'she', 'looms', 'bill', 'berkrot', 'slam', 'seed', 'steffi', 'graf', 'aiming', 'able', 'ease', 'begins', 'opens', 'crown', 'top-ranked', 'yayuk', 'basuki', 'ceremony', 
'revealed', 'holders', 'looming', 'third-round', 'nemesis', 'rising', 'avenged', 'defeat', '19-year-old', 'hitter', 'first-week', 'fireworks', 'stunning', 'upset', 'sailing', 'predictable', 'semifinal', 'showdown', 'tested', 'probably', '28th-ranked', 'natasha', 'zvereva', 'repeat', 'eighth-ranked', 'landing', 'bumping', 'sixth', 'avoided', 'possibility', 'quarter-finals', 'lock', 'horns', 'semis', 'surprise', 'ranked', 'monica', 'seles', 'anne', 'miller', 'victim', 'second-ranked', 'austrian', 'seeded', 'luck', 'faces', 'playing', 'survives', 'fifth-seeded', '12th-seeded', 'perhaps', 'yet', 'unfortunate', 'first-round', 'matchup', 'pits', 'popular', 'swede', 'two-time', 'farewell', 'one-match', 'affair', 'exception', 'looks', 'comfortable', 'likes', 'frenchman', 'ailing', 'nursing', 'rib', 'injury', 'path', 'runner-up', 'fifth-ranked', 'anke', 'huber', 'conchita', 'martinez', 'eighth-seeded', 'lindsay', 'davenport', 'looking', 'opponents', 'encounter', '18th-ranked', 'amanda', 'coetzer', 'talent', 'martina', 'hingis', '16th', 'probable', 'quarter-final', 'clash', 'seventh-seeded', 'jana', 'novotna', 'ruxandra', 'dragomir', '61-2', '9373-1800', 'rtrs', 'top-seeded', '123rd-ranked', 'lefthander', 'rallies', 'constantly', 'attacking', 'tactic', 'worked', 'second-round', 'bye', 'along', 'seeds', 'second-seeded', '6-7(3-7', 'unseeded', 'advancing', 'seeed', 'eliminated', 'hour', '55', 'saved', 'point', '5-6', 'third-set', 'break', 'compatriot', '13th', 'fortunate', '9-8', 'marathon', 'knew', 'ranks', 'breaks', 'lanky', 'strokes', 'joking', 'chipping', 'charging', 'serving', 'volleying', 'really', 'timing', 'baseline', 'chances', 'every', 'come', 'lights', 'maybe', 'difference', '2-5', 'deficit', 'erratically', '44th-ranked', 'famous', '32', 'aces', 'outplayed', '24-year-old', 'sixth-ranked', 'indianapolis', 'quick', 'getaway', 'arrived', 'feeling', 'soon', 'unfocused', 'calm', 'nervy', \"'m\", 'fought', 'tiebreak', 'serves', 'hoped', 'tight', 'shanked', 'forehand', 
'5-all', 'helped', 'korean', 'pro-soccer', 'seoul', 'anyang', 'chonnam', 'puchon', 'suwon', 'drawn', 'd', 'g', 'f', 'p', 'chonan', 'pohang', 'pusan', 'ulsan', 'chonbuk', 'senegal', 'cholera', 'outbreak', 'kills', 'dakar', 'kaolack', '291', 'doctor', 'masserigne', 'ndiaye', 'staff', 'overwhelmed', 'rushing', 'symptoms', 'appear', 'deaths', '160', 'southeast', 'senegalese', 'nigerian', 'liberia', 'ecomog', 'monrovia', 'sam', 'victor', 'malu', 'commander', 'peacekeeping', 'latest', 'civil', 'inienger', 'officers', 'handover', 'dozen', 'accords', 'difficult', 'challenging', 'painful', 'peacekeepers', 'harassed', 'assure', 'sight', 'nations', 'observers', 'travelling', 'tubmanburg', 'monitor', 'delayed', 'shooting', 'highway', 'anthony', 'nyakyi', 'finally', 'escort', 'ulimo-j', 'faction', 'abuja', 'saturday', 'breaking', 'foresees', 'disarmament', '60,000', 'combatants', '10,000', 'height', 'guinea', 'prayer', 'conakry', 'broadcast', 'repeatedly', 'dead', 'prosperity', 'precise', 'reason', 'clear', 'lansana', 'conte', 'vice-president', 'organisation', 'conference', 'prepare', 'oic', 'koranic', 'reading', 'sessions', 'prayers', 'farming', 'badi-tondon', 'army', 'survived', 'revolt', 'veiled', 'topple', 'ordered', 'crackdown', 'corruption', 'seized', '1984', 'death', 'marxist', 'sekou', 'toure', '1993', 'answers', 'bottle', 'johannesburg', 'boy', 'writing', 'girl', 'whose', 'washed', 'nelson', 'mandela', 'old', 'prison', 'carlo', 'hoffmann', '11-year-old', 'jailer', 'son', 'beach', 'robben', 'winter', 'storms', 'letter', 'ordinary', 'mail', 'post', 'danielle', 'murray', 'sandusky', 'age', 'penfriend', 'reply', 'whoever', 'flung', 'journey', 'atlantic', 'ocean', 'rottweiler', 'toddler', 'dog', 'belonging', 'elderly', 'couple', 'savaged', 'two-year-old', 'grandson', 'booy', 'garden', 'grandparents', 'vanderbijlpark', 'bloody', 'body', 'lying', 'parents', 'pick', 'unclear', 'fierce', 'enough', 'scare', 'burglars', 'becoming', 'increasingly', 'crime-infested', 'indicators', 
'updated', 'cpi', '+0.4m', 'm', '23.0yr', '+0.9;+23.6', 'ppi', '+0.7', 'm;+21.5yr', '+1.7;+22.0', '7.8', 'm;-0.2yr', '+7.3;-3.6', 'jan-may', '738', '748', 'nbh', '934', '774', 'mit', 'jan-june', '1.45', 'bln', '1.24', 'gross', '27,246.5', '28,716.8', '14,390.7', '15,704.3', 'unemployment', '10.8', '10.6', 'budget', 'huf', 'jan-july', '102', '122', 't-bill', 'yields', '%', '1mo', '22.95', '3mo', '23.02', '6mo', '23.53', '1yr', '24.40', '2-yr', '1998', 'j', '25.49,(3-yr', '24.44', 'bbb-minus', 'duff', '&', 'phelps', 'ibca', 'thomson', 'bankwatch', 'bb-plus', 'ba1', 'investors', 'bbb+', 'credit', 'flow', '36', '1)266', '2410', 'fifty', 'die', 'rebels-interfax', 'least', 'servicemen', 'separatist', 'chechen', 'grozny', 'interfax', 'command', 'chechnya', '200', 'interior', 'reconaisance', 'mission', 'clashed', 'minutka', 'square', 'independently', 'confirmed', 'peacemaker', 'lebed', 'chief-of-staff', 'aslan', 'maskhadov', 'agreement', 'cease', 'hostilities', 'noon', '0800', 'detachment', '1500', 'raged', '1600', 'outnumbered', 'schoolgirl', 'blackmailer', 'textbooks', 'gdansk', 'blackmailed', 'letters', 'threatening', 'explained', 'money', '13-year-old', 'extract', 'zlotys', 'residents', 'sierakowice', 'lives', 'nearby', 'blackmail', 'railway', 'station', 'interviewed', 'psychologist', 'books', 'clothes', 'kazimierz', 'socha', 'case', 'poor', 'family', 'trouble', 'underage', 'offenders', 'cnb-120', 'index', 'pts', '869.3', 'broad', 'measure', 'equities', 'cnb', 'ten', 'sectoral', 'indices', 'banking', '14.4', '1,294.5', '42-2-2423-0003', 'sign', 'novye', 'atagi', 'boris', 'yeltsin', 'security', 'supremo', 'renewed', 'negotiated', 'village', 'officially', 'disclosed', 'itar-tass', 'provided', 'disengagement', 'aide', 'russian-chechen', 'detailed', 'barkhatov', 'rebel-held', 'progressing', 'briskly', 'mood', 'completed', 'signature', 'day-by-day', 'showed', 'clip', 'laughing', 'smiling', 'nominee', 'tatyana', 'dmitrieva', 'inaugurated', 'returned', 'kremlin', 'two-day', 
'lakelands', 'northwestern', 'bosnia', 'sarajevo', 'oslobodjenje', 'bosnian', 'federation', 'launches', 'common', 'taxes', 'dinar', 'kuna', 'deutsche', 'currency', 'introduced', 'refugees', 'displaced', 'persons', 'mirhunisa', 'komarica', 'survivors', 'massacre', 'srebrenica', 'languishing', 'laborers', 'serbian', 'mines', '2,400', 'male', 'trepca', 'mine', '1,900', 'aleksandrovac', 'dnevni', 'avaz', 'slovenian', 'briefly', 'detain', 'ljubljana', 'cancel', 'maribor', '+387-71-663-864', 'overnight', 'raids', 'alkhan-yurt', 'pounded', 'planes', 'artillery', 'calmed', 'although', 'sporadic', 'explosions', 'heard', 'correspondent', 'lawrence', 'sheets', 'arrival', 'flew', 'firing', 'anything', 'clinched', 'separatists', 'halt', 'threatened', 'bombing', 'assault', 'boat', 'passengers', 'rescued', 'colombian', 'coast', 'bogota', 'guard', 'pacific', 'missing', 'tiny', 'gorgona', 'southwest', 'sightseers', 'trip', 'narino', 'fuel', 'navy', 'lt.', 'italo', 'pineda', 'boatman', 'coconuts', 'rainwater', 'sea', 'towed', 'buenaventura', 'argentine', 'raw', 'steel', '14.8', 'buenos', 'aires', '355,900', '1.9', 'center', 'primary', '297,700', '0.1', 'hot', 'laminate', 'production', '349,000', '0.8', 'cold', 'laminates', '120,500', '4.2', 'webb', '+541', '318-0655', 'peru', 'kill', 'jungle', 'lima', 'peruvian', 'northeastern', 'anti-', 'terrorist', 'sources', 'maoist', 'shining', 'alomella', 'robles', 'small', '345', '550', 'northeast', 'villagers', 'listen', 'propaganda', 'speeches', 'passing', 'motorists', 'daubed', 'slogans', 'whereabouts', 'severely', 'weakened', '1992', 'capture', 'abimael', 'stepping', 'activities', 'guerrilla', 'conflicts', 'cost', 'damage', 'infrastructure', '1980', 'surinam', 'paramaribo', 'flamboyant', 'surinamese', 'ronny', 'brunswijk', 'custody', 'charged', 'attempted', 'murder', 'turned', 'himself', 'freddy', 'pinas', 'surinamese-born', 'visitor', 'bar-room', 'brawl', 'mining', 'moengo', '56', '90', 'ro', 'gajadhar', 'showing', 'cuts', 'bruises', 
'feared', 'shoot', 'objected', 'advances', 'wife', 'bodyguards', 'charges', 'merely', 'defended', 'less', 'thief', 'buttocks', 'uprising', 'regime', 'strongman', 'desi', 'bouterse', 'conflict', '500', 'caused', 'flee', 'neighbouring', 'guiana', '1980s', 'eventually', 'paved', 'businessman', 'logging', 'interests', 'manages', 'occasionally', 'noisy', 'saw', 'leads', 'thai', 'heroin', 'hideaway', 'bangkok', 'hong', 'kong', 'carpenter', 'arrested', 'seaside', 'pattaya', 'kg', '39.7', 'complaints', 'cheung', 'siu', 'searched', 'bags', 'hidden', 'hollow', 'spaces', 'wooden', 'planks', 'hired', 'hide', 'sawing', 'escaping', 'door', 'baht', 'hunting', 'collaborators', 'detained', 'pending', 'formal', 'downer', 'follows', 'friction', 'qian', 'qichen', 'consulate', 'sovereignty', 'colony', 'mid-1997', 'strained', 'uranium', 'issues', 'affecting', 'include', 'plans', 'pact', 'canberra', 'tibet', 'exiled', 'spiritual', 'dalai', 'lama', 'conservative', 'accuse', 'pa', 'nablus', 'bookseller', 'information', 'undertaking', 'distribute', 'written', 'critics', 'self-rule', 'deals', 'anyone', 'legal', 'destroy', 'amman', 'daoud', 'makkawi', 'owner', 'nablus-based', 'al-risala', 'bookshop', 'copies', 'edward', 'prominent', 'scholar', 'citizen', 'origin', 'outspoken', 'critic', 'accord', 'confiscated', 'israel-plo', 'director-general', 'mutawakel', 'taha', 'insisted', 'censor', 'strategy', 'suppress', 'freedom', 'expression', 'whatsoever', 'relevent', 'legislations', 'resulted', 'mistakes', 'explain', 'journalists', 'writers', 'authors', 'journalist', 'seale', 'banned', 'shop', 'sure', 'selling', 'think', 'afraid', '?', 'strip', 'jewish', 'handed', 'parts', 'blames', 'istanbul', 'tower', 'carrier', 'egyptair', 'airport', 'twenty', 'boeing', '707', 'overshot', 'runway', 'fire', 'taxi', 'skipped', 'onto', 'line', 'mohamed', 'fahim', 'rayyan', 'instead', '2,250', '2,460', 'yards', '3,300', 'steep', 'aviation', 'noted', 'pilot', 'misleading', 'rainstorm', 'wet', 'brake', 'medium', 
'wrong', 'private', 'ihlas', 'wants', 'nothing', 'sudanese', 'rulers', 'egyptian', 'shelter', 'militants', 'hosni', 'mubarak', 'speech', 'moslem', 'addis', 'ababa', 'sponsored', 'council', 'flights', 'khartoum', 'incident', 'effect', 'sudan', 'fails', 'extradite', 'cannot', 'ethiopia', 'eager', 'turabi', 'whatever', 'academics', 'al-turabi', 'bitter', 'terrorists', 'sheltering', 'passorts', 'far', 'ostensibly', 'shares', 'shed', 'profit-taking', 'shedding', 'amid', 'imkb-100', '123.89', '64,178.78', 'totalled', '2.92', 'volume', '7.2', 'trillion', 'lira', 'actually', 'reaction', 'rise', '63,000', 'tomorrow', 'burcin', 'mavituna', 'profit', 'approached', '65,000', 'cheap', 'attracted', '67,000', 'pierced', 'session', 'isbank', 'gained', '8,600', 'utility', 'cukurova', '85-share', '0.47', '70,848.86', '15-share', '0.55', '55,929.89', '218', 'gainers', 'outdid', 'losers', 'stable', '+90-212-275', '0875', 'sa', 'universe', 'hides', 'veil', 'silence', 'kieran', 'las', 'cruces', 'n.m.', 'alicia', 'machado', 'mexico', 'questions', 'claims', '19', 'slipping', 'desert', 'attended', 'teen', 'usa', 'pageant', 'contestant', 'scrutiny', 'ultimatum', 'angeles-based', 'inc.', 'drop', 'losing', 'swollen', 'wisdom', 'teeth', 'extracted', 'marta', 'fajardo', 'weighed', '112', 'vegas', 'habits', 'everybody', 'addiction', 'eats', 'cakes', 'crazy', 'flatly', 'wraps', 'blocked', 'access', 'dressed', 'strapless', 'gown', 'heavier', 'contestants', 'rave', 'reviews', 'appearance', 'stage', 'kidding', 'fantastic', 'nikki', 'sexy', 'publicists', 'stay', 'promotional', 'sponsors', 'returning', 'beauty', 'queens', 'high-profile', 'personalities', 'alleged', 'eased', 'indulged', 'passion', 'pasta', 'cake', 'fat', 'putting', 'fine', 'wished', 'happened', 'spiritually', 'mentally', 'terrific', 'lifestyle', 'associated', 'routine', 'exercise', 'ability', 'regimented', 'workout', 'exist', 'dont', 'talked', 'kevorkian', 'attends', 'suicide', 'pontiac', 'mich', 'bringing', '40-year-old', 'missouri', 
'suffering', 'multiple', 'sclerosis', 'emergency', 'room', 'aranosian', 'osteopathic', 'patricia', 'smith', 'lees', 'midday', 'paralysed', 'assisted-suicide', '37th', 'attending', 'starting', 'crusade', 'assisted', 'lawyer', 'geoffrey', 'fieger', 'husband', 'father', 'james', 'patients', 'location', 'rapidly', 'multple', 'louise', 'siebens', '76-year-old', 'amyotrophic', 'lateral', 'lou', 'gehrig', 'judith', 'curren', '42-year-old', 'massachusetts', 'suffered', 'chronic', 'fatigue', 'syndrome', 'non-terminal', 'life', 'fairview', '1.82', 'baa1', '08/21/96', 'issuer', 'tx', '1,820,000', '08/27/96', 'municipal', 'desk', '212-859-1650', 'defiant', 'neo-nazi', 'jailed', 'gray', 'sentenced', 'lauck', 'pumping', 'extremist', 'lincoln', 'nebraska', 'yelled', 'tirade', 'abuse', 'conviction', 'inciting', 'racial', 'hatred', 'struggle', '43-year-old', 'shouted', 'escorted', 'arguing', 'client', 'offence', 'hailed', 'neo-nazism', 'network', 'anti-semitic', 'material', 'flowing', '1970s', 'possessed', 'well-oiled', 'machine', 'honed', 'presiding', 'judge', 'guenter', 'bertram', 'cannon', 'extracts', 'praising', 'hitler', 'greatest', 'describing', 'nazi', 'slaughter', 'millions', 'jews', 'myth', 'bars', 'complex', 'prosecutor', 'mauruschat', 'offences', 'demanded', 'five-year', 'satisfied', 'sentence', 'publishing', 'distributing', 'illegal', 'argued', 'laws', 'meant', 'produce', 'swastika-covered', 'magazines', 'videos', 'flags', 'manfred', 'kanther', 'welcomed', 'prosecution', 'ringleaders', 'biggest', 'distributers', 'vicious', 'racist', 'publications', 'democrats', 'sober', 'suit', 'sporting', 'trademark', 'hitleresque', 'moustache', 'emotion', 'spent', 'explaining', 'blurted', 'virtually', 'incomprehensible', 'quick-fire', 'diatribe', 'neither', 'nazis', 'nor', 'communists', 'dared', 'kidnap', 'oblique', 'reference', 'extradition', 'truth', 'attorney', 'hans-otto', 'sieg', 'courtroom', 'judges', 'actions', 'carried', 'obsessed', 'nazism', 'devoted', 'workers', 'nsdap-ao', 
'derives', 'name', 'three-month', 'dealt', 'ns', 'kampfruf', 'cry', 'magazine', 'references', 'aryan', 'supremacy', 'defamatory', 'statements', 'rejected', 'argument', 'request', 'convicted', 'disseminating', 'symbols', 'anti-constitutional', 'organisations', 'arrest', 'subtracted', 'un', 'occur', 'arrangements', 'implement', 'oil-for-food', 'quite', 'speculate', 'preparations', 'anxious', 'undersecretary-general', 'yasushi', 'akashi', 'sooner', 'monitors', 'carry', 'department', 'humanitarian', 'deputy', 'speculated', 'suspected', 'killers', 'bishop', 'algeria', 'tv', 'algerian', 'killing', 'state-run', 'sought', 'slain', 'assassination', 'roman', 'catholic', 'pierre', 'claverie', '58-year-old', 'bomb', 'oran', 'herve', 'charette', 'algiers', '50,000', 'algerians', '110', 'foreigners', 'pitting', 'radical', 'islamists', 'commanding', 'flown', 'january-july', 'table', 'shows', 'volumes', 'handled', 'airports', 'exclude', 'trucked', 'airfreight', 'adv', 'berlin', '17,844', '5.9', 'tegel', '10,896', '3.1', 'tempelhof', '202', '60.0', 'schoenefeld', '6,746', '16.8', 'bremen', '1,453', '13.1', 'dresden', '792', '11.4', 'duessseldorf', '31,347', '4.4', '768,269', '1.5', '21,240', '3.5', 'hannover', '6,030', '15.3', 'koeln', 'cologne', '182,887', '11.8', 'leipzig', 'halle', '1,806', '45.6', 'munich', '44,525', 'muenster', 'osnabrueck', '382', '28.2', 'nuremberg', '25,929', '17.8', 'saarbruecken', '626', '28.3', '10,655', '1,113,785', 'tel+44', '161', '7706', 'fax+44', '5017', 'paribas', 'repeats', 'aegon', 'company-------------price---broker----------------', '83.40', 'comment', '711', 'forecast', 'performance', 'reiterates', 'estimates', 'dfl', 'eps', 'e', 'dividend', '5.83', '13.8', '2.75', '6.59', '12.2', '3.10', 'fax', '5040', 'clinton', 'ballybunion', 'fans', 'dublin', 'resort', 'whirlwind', 'irish', 'america', 'dick', 'spring', 'convention', '26-29', 'bring', 'placards', 'waved', 'addressed', 'packed', 'backs', 'requested', 'guests', 'kennedys', 'frank', 'quilter', 
'triumphant', 'process', 'observe', 'assurances', 'erdmann', 'wolfgang', 'ischinger', 'assured', 'valid', 'primakov', 'pledge', 'seek', 'solution', 'aegis', 'osce', 'quoting', 'klaus', 'kinkel', 'personal', 'urge', 'breakaway', 'threat', 'unauthorised', 'initiative', 'intention', 'positive', 'goldiman', 'responsible', 'delhi', 'global', 'nuclear', 'treaty', 'intended', 'i.k.', 'gujral', 'block', 'adoption', 'entering', 'signing', 'kind', 'weapons', '1974', 'assemble', 'veto', 'comprehensive', 'ctbt', 'bilateral', 'visualise', 'straining', 'text', 'position', 'clause', 'providing', 'modified', 'forwarded', 'assembly', 'cross', 'reiterated', 'objections', 'negotiation', 'fact', 'weapon', 'hegemony', 'concerns', 'impossible', 'oblige', 'option', 'exercised', 'restraint', 'carrying', 'tests', 'lone', 'accept', 'constraints', 'rely', 'arsenals', 'sour', 'dhaka', 'disquiet', 'bangladeshi', 'bangladesh', 'goverment', 'attached', 'importance', 'tragic', 'siraj', 'mia', 'under-secretary', 'commonwealth', 'liam', 'fox', 'interogation', 'arriving', 'bore', 'injuries', 'relatives', 'complained', 'murdered', 'post-mortem', 'tortured', 'drunk', 'wrist', 'act', 'seriously', 'reasons', 'important', 'relationship', 'leave', 'nepal', 'governments', 'commons', 'matter', 'thorough', 'investigation', 'outcome', 'harassment', 'nationals', 'criminal', 'immigration', 'connection', 'suburb', 'disrupt', 'kashmir', 'polls', 'srinagar', 'planning', 'troubled', 'jammu', 'seems', 'inderjit', 'gupta', '1987', 'clamped', 'direct', 'abetting', 'militancy', 'valley', 'islamabad', 'infiltrating', 'create', 'disturbance', 'noticed', 'among', 'growing', 'mercenaries', 'independence', '1947', 'h.d.', 'deve', 'gowda', 'centre-left', 'hopes', 'restore', 'normality', '20,000', 'insurgency-related', 'militant', 'engineering', 'banks', 'edged', 'sharply', 'institutional', 'stock', 'exchange', 'dse', 'all-share', '0.7', '1,156.79', 'turnover', '146.2', 'taka', 'remained', 'unchanged', '12.71', '228.7', 
'cables', '20.37', '677.98', 'apex', 'tannery', '22.72', '597', 'recovered', 'edge', 'short-covering', 'ratio', 'governor', 'rangarajan', 'crr', 'maintained', 'reduced', 'addressing', 'industrialists', 'having', 'theoretical', 'supply', 'instrument', 'regulate', 'reducing', 'increasing', 'context', 'stood', 'commitment', 'response', '+91-11-3012024', 'viable', 'bombay', 'chakravarty', 'product', 'gdp', 'sustainable', 'currrent', 'real', '16-17', '14-15', 'non-debt', 'reduction', 'debt-service', '+91-22-265', '9000', 'teresa', 'calcutta', 'saint', 'gutters', 'nobel', 'prize', '1979', 'hope', 'dignity', 'unwanted', 'simple', 'heaps', 'honours', 'regards', 'nun', 'albanian', 'descent', 'maintains', 'joy', 'fulfilment', 'neglected', 'need', 'sympathy', 'pity', 'compassion', 'diminutive', 'missionary', 'respiratory', 'intensive', 'indian', 'turns', '86', 'conscious', 'condition', 'task', 'alone', 'slums', 'densely-populated', 'grew', 'characteristically', 'unworthy', 'showering', '80', 'bharat', 'ratna', 'jewel', 'highest', 'award', 'deteriorate', 'fitted', 'pacemaker', 'vatican', 'superior', 'missionaries', 'charity', 'delegates', 'elect', 'successor', 'agree', 'bacterial', 'pneumonia', 'rome', 'ribs', 'receive', 'malaria', 'complicated', 'lung', 'fractured', 'collar', 'bone', 'frailty', 'arthritis', 'failing', 'eyesight', 'stopped', 'travels', 'mingle', 'desperate', 'agnes', 'goinxha', 'bejaxhiu', 'serbia', '1910', 'deeply', 'religious', 'loretto', 'hoping', 'abbey', 'begin', 'novitiate', 'teach', 'geography', 'convent', 'divine', '1946', 'interviewer', 'belonged', 'approved', 'training', 'slum', 'therese', 'jesus', 'simply', 'dying', 'hindu', 'rest', 'penniless', 'nirmal', 'hriday', 'chain', '150', 'homes', 'destitute', 'admitting', '18,000', 'founded', 'documentary', 'mixture', 'hyperbole', 'credulity', 'catholics', 'focus-news', 'forecasts', 'alien-led', 'boost', 'bernard', 'hickey', 'baron', 'rupert', 'murdoch', 'ltd', '1995/96', 'profits', 'film', '1996/97', 
'perspective', 'begun', 'promise', 'motion', 'picture', 'announcing', 'moderating', 'solid', 'orders', 'advertising', 'broadcasting', 'budgeted', 'attainable', 'soothed', 'pre-abnormals', 'a$', '1.26', 'us$', '995', 'cents', '1.343', 'disappointing', 'lachlan', 'drummond', 'offset', 'divisions', 'hefty', 'asian', 'operations', 'newsprint', 'hard', 'throughout', 'cover', 'revenues', 'surprises', 'inserts', 'guide', 'dramatically', 'arm', 'harper-collins', 'healthy', 'operation', 'demise', 'hurt', 'minimum', 'setting', 'expired', 'publishers', 'pulled', 'spotlight', 'understatement', \"'re\", 'internal', 'declined', '6.39', '2.00', 'p.m.', '0400', 'soft', '0.79', '373-1800', 'savings', 'rba', 'slash', 'useful', 'contribution', 'realised', 'raising', 'consolidation', 'unduly', 'restrict', 'ambiguous', 'coalition', '5.65', 'pledged', '1998/99', '10.3', 'credible', 'rein', 'unsustainable', 'favourable', 'effects', 'activity', 'generally', 'long-term', 'saving', 'tending', 'promote', 'investment', 'lowering', 'bnz', 'nz', 'fixed', 'lending', 'wellington', 'cutting', '10.5', '10.75', '10.95', '11.25', 'responding', 'wholesale', '4734', '746', 'odv', 'nz$', '524', 'optimised', 'deprival', '524.2', '486.5', 'valuation', 'reflected', 'extensions', 'lifespan', 'consistent', 'approach', 'followed', 'preventative', 'equipment', 'upgrading', 'revaluation', 'undertaken', 'disclosure', 'requirements', 'commerce', 'thais', 'hunt', 'breaker', 'thailand', 'launched', 'manhunt', 'awaiting', 'drug', 'possession', 'westlake', 'victoria', 'sucessful', 'escape', 'klongprem', 'outskirts', 'massive', 'confident', 'vivit', 'chatuparisut', 'correction', 'trafficking', 'sawed', 'grill', 'cell', 'window', 'climbed', 'five-metre', '15-foot', 'rope', 'bed', 'corrections', 'probing', 'inmates', 'chained', 'prevent', 'breakouts', '266', 'westerners', 'tokyo', 'soir', 'parent', 'billions', 'yen', 'specified', 'actual', 'year-ago', '26.00', '26.70', '400', '329', '250', '84', '11.61', '3.92', 'ord', 
'10.00', 'specialised', 'manufacturer', 'wear', 'ka', 'wah', 'hk$', '43', 'frcd', 'floating', 'certificate', 'privately', 'placed', 'sole', 'arranger', 'hsbc', 'facility', 'tenor', 'pays', 'basis', 'clearing', 'moneymarkets', '852', '2847', '4039', 'bans', 'nitrofuran', 'usage', 'chicken', 'antibiotic', 'applications', 'believes', 'cancer', 'breeders', 'feedmillers', 'abide', 'respect', 'safety', 'chua', 'jui', 'meng', 'bernama', 'two-year', 'maximum', 'ringgit', '2000', 'indonesian', 'watch', 'jakarta', '**', 'involving', 'megawati', 'sukarnoputri', 'stationed', 'demonstrators', 'dow', '31.44', '5,689.82', 'three-session', 'streak', 'tobacco', 'beating', 'composite', '2.60', '0.48', '542.20', 'bargain-hunting', 'big-capitalised', 'secondliners', 'rupiah', '2,343.00', '43.50', 'trading', '2,342.75', 'packaging', 'super', 'indah', 'makmur', 'offer', 'pt', 'vdh', 'teguh', 'sakti', 'wholly-owned', 'subsidiary', 'singapore-listed', 'privately-owned', 'duta', 'obtaining', 'fresh', 'syndicated', 'loans', 'management', 'reshuffle', 'ciputra', 'build', 'property', 'projects', 'worth', 'surabaya', 'movements', 'indices*', 'exchanges', 'change', 'highs', 'lows', 'dates', 'japanese', 'pound', 'gold', 'bullion', 'closes', 'brackets', 'low', '5,710.53', '22.94', '5,778.00', '5,032.94', '3,907.5', '+16.4', '3,632.3', '21,228.80', '134.44', '22,666.80', '19,734.70', 'jun', 'mar', '2,555.16', '2.10', '2,583.49', '2,284.86', '2,020.82', '+3.06', '2,146.79', '1,897.85', 'apr', '2,292.9', '+18.3', '2,326.00', '2,096.10', '11,424.64', '54.13', '11,594.99', '10,204.87', 'feb', '1.4871', '1.4935', '....', '108.50', '108.43', '1.5520', '1.5497', 'ounce', '387.50', '386.95', '*indices', 'all-time', '22/96', 'ftse-100', '23/96', 'nikkei', '38,915.87', 'dec', '29/89', 'dax-3o', '5/96', 'cac-40', '2,355.93', '2/94', 'all-ordinaries', '2,340.6', '3/94', 'hang', 'seng', '12,201.09', '4/94', 'hails', 'marks', 'rostislav', 'khotin', 'kiev', 'celebrates', 'hailing', 'inter-ethnic', 'post-soviet', 
'achievement', 'declaration', 'nine-to-one', 'effectively', 'blow', 'soviet', 'empire', 'centuries', 'largest', 'republics', 'tajikistan', 'achievements', 'preservation', 'harmony', 'leonid', 'kuchma', 'televised', 'unlike', 'situations', 'peaceful', 'civilised', 'initially', 'accompanied', 'hyper-inflation', 'collapse', 'turnaround', 'inflation', 'hyper-inflationary', '10,300', 'respectable', 'economy', 'grow', 'solemn', 'ukraina', 'palace', 'turning', 'reforms', 'doubt', 'adelbert', 'knobl', 'monetary', 'fund', 'proud', 'much-postponed', 'hryvna', 'replace', 'karbovanets', 'rouble', 'trades', '33', 'introduce', 'postpone', 'promptly', 'nato', 'policy', 'wrangle', 'offending', 'unofficial', 'top-level', 'delegation', 'protest', 'hennady', 'udovenko', 'overreacting', 'seeing', 'itself', 'westernising', 'strategic', 'aim', 'integration', 'economically', 'oriented', 'though', 'circles', 'push', 'membership', 'associate', 'grouping', 'closer', 'congratulated', 'anniversary', 'promising', 'stabilising', 'factor', 'oldest', 'disappears', '16th-century', 'earliest', 'complete', 'example', 'disappeared', 'archives', 'gazeta', 'shqiptare', 'mass', 'gjon', 'buzuku', 'dating', '1555', 'discovered', '1740', 'seminary', 'published', 'language', 'albanians', 'sons', 'lamented', 'musa', 'hamiti', 'library', 'grateful', 'civilisation', 'inventing', 'photocopies', 'clamp', 'barter', 'keen', 'adopt', 'concerned', 'viewing', 'disguised', 'volkova', 'exported', 'unimported', '1.10', '4.9', '61.5', 'understated', 'decree', 'substantially', 'situation', 'traders', 'obliged', '180', 'fines', 'understating', 'loophole', 'tackling', 'technicalities', 'feature', 'decrees', 'liberalising', '1991-1992', 'impetus', '25-30', 'popped', 'preferred', 'reliable', 'transfer', 'systems', 'various', 'sorts', 'tranfers', 'incompetent', 'experienced', 'ones', 'dmitry', 'solovyov', '+7095', '941', '8520', 'viacom', 'sequel', 'paramount', 'pictures', 'cruise', 'blockbuster', 'release', 'variety', 
'big-screen', 'version', 'spy', 'grossed', '175', 'domestically', '338', 'inc-owned', 'forrest', 'gump', 'plot', 'reprise', 'roles', 'co-producer', 'academy', 'award-winning', 'screenwriter', 'goldman', 'write', 'script', 'brian', 'palma', 'crack', 'oscars', 'butch', 'cassidy', 'sundance', 'kid', 'criticised', 'blockbusters', 'singled', 'entertaining', 'movie', 'sit', 'batsman', 'endure', 'frustrating', 'delay', 'resuming', 'quest', 'maiden', 'century', 'heavy', 'rain', 'drizzle', 'improvement', 'weather', 'umpires', 'announce', '1415', '1315', 'event', 'unbeaten', 'spotted', 'strumming', 'dressing-room', 'damp', 'patches', 'outfield', 'raining', '1230', '1130', 'brighter', 'bowled', '1900', '1800', 'practice', 'spa-francorchamps', 'gerhard', 'berger', 'benetton', '53.706', 'seconds', 'coulthard', 'mclaren', '1:54.342', 'jacques', 'villeneuve', '1:54.443', 'mika', 'hakkinen', '1:54.754', 'heinz-harald', 'frentzen', '1:54.984', 'jean', 'alesi', '1:55.101', 'damon', 'hill', '1:55.281', 'schumacher', '1:55.333', 'brundle', '1:55.385', 'rubens', 'barrichello', '1:55.645', '11.', 'herbert', 'sauber', '1:56.318', '12.', 'olivier', 'panis', 'ligier', '1:56.417', '[', 'corrected', '05:30', ']', 'gabriela', 'sabatini', 'asa', 'carlsson', 'katarina', 'studenikova', 'karina', 'habsudova', 'corrects', 'portsmouth', 'tranmere', 'grimsby', 'stirling', 'albion', '298-6', 'harden', '194-0', 'gooch', '105', 'robinson', '255-3', 'hooper', '389', 'penberthy', '4-36', '160-4', 'k.', 'curran', '310', '83', 't.', 'munton', 'illingworth', '4-54', 'lampitt', '4-90', '10-0', '529-8', '181', 'blakey', '109', '162-4', 'fairbrother', 'pollock', 'shaun', 'ankle', 'returns', 'swap', 'counties', 'premature', 'departure', 'unavoidable', '106', 'lb-12', 'nb-10', '7-283', '8-284', '9-295', '29.2-9-83-3', '25-6-95-4', '116', 'lb-1', 'wicket', '229', '1-106', '9-1-49-0', '9-3-28-0', '17-3-42-1', '7-1-38-0', '14-0-71-0', '4-95', 'ravanelli', 'shirt', 'dance', 'middlesbrough', 'italian', 'fabrizio', 
'sponsor', 'seen', 'grey-haired', 'forward', 'pulls', 'shirtfront', 'salute', 'spectacle', 'celebrate', 'fun', 'besides', 'chest', 'aggravated', 'foot', 'chelsea', 'forest', 'bryan', 'robson', 'advance', 'aussies', 'reached', 'straight-set', 'victories', 'noteworthy', 'sixth-seeded', 'advanced', 'third-seeded', 'three-hour', 'eliminating', 'americans', 'overcame', '2-6', '12th-ranked', '70th-ranked', 'getting', 'handle', 'pretty', 'easily', '40s', 'things', 'missed', 'felt', '9:30', 'midnight', 'wake', 'routines', 'happier', 'person', '11th-ranked', 'aggressive', 'wind', 'affected', '26-year-old', 'atp', 'haven', '285th', 'hitting', 'ball', 'mental', 'letdowns', 'competing', 'lot', 'shots', 'marvelling', 'exciting', '64-stroke', 'joked', 'mostly', 'rugby', 'mulder', 'japie', 'pretoria', 'durban', 'spasms', 'fitness', 'check', 'springbok', 'teichmann', 'bruised', 'thigh', 'markgraaff', 'means', 'transvaal', 'snyman', 'cap', 'alongside', 'colleague', 'danie', 'schalkwyk', 'wing', 'pieter', 'hendriks', 'speculation', 'line-up', 'shortly', 'denote', 'seedings', 'ong', 'ewe', 'hock', '15-10', '15-5', 'ijaya', '5-4', 'gang', '15-9', 'chanda', 'rubin', '10th-ranked', '20-year-old', 'tendinitis', 'sidelined', 'misfortune', 'lucky', 'assignments', '17th-ranked', 'highest-ranked', 'non-seeded', 'player', 'moved', 'slot', 'notable', 'withdrawal', 'mary', 'pierce', '20th-ranked', 'meredith', 'mcgrath', 'becker', '.571', '.354', '.450', '.578', '.516', '.477', '.465', '47', '.627', '.540', '.406', '.531', '.528', '.425', '.432', 'doubleheader', 'sorrento', 'routs', 'oriole', 'moyer', 'tiring', 'routed', '10-3', '10-2', 'tagged', 'pair', 'devereaux', 'brady', 'anderson', 'walked', 'none', 'struck', 'norm', 'charlton', 'batters', 'seal', 'ken', 'griffey', 'jr', 'edgar', 'stroked', 'back-to-back', 'rocky', 'coppinger', 'jay', 'buhner', '7-0', 'advantage', 'fielder', 'touched', 'slams', 'wild-card', 'heading', 'pitches', 'dwell', 'troy', \"o'leary\", 'foul', 'pole', 'roger', 
'clemens', '7-11', 'shutout', 'pinch-hitter', 'matt', 'stairs', 'tripled', 'tinsley', 'steinbach', 'dunked', 'broken-bat', '28-inning', 'longest', 'majors', 'pitched', 'reliever', 'acre', '0-1', 'garret', 'disarcina', 'apiece', 'edmonds', 'highlighted', 'six-run', 'coasted', '12-3', 'battered', 'rogers', 'outscored', '21-1', 'finley', '12-12', 'four-game', 'travis', 'fryman', 'doubled', 'go-ahead', 'melvin', 'nieves', 'damion', 'easley', 'claimed', 'handing', 'halted', 'seven-game', 'thompson', 'belcher', '12-8', 'en', 'route', 'red-hot', 'contests', '14-7', 'yielded', 'covering', 'erik', 'hanson', 'outdueled', 'fernandez', 'jacob', 'brumfield', 'otis', 'blanked', 'shortened', '11-15', 'lisbon', 'luis', 'predrosa', 'cruised', '3-1', 'sc', 'espinho', 'drilled', 'right-foot', 'nail', 'besirovic', '35th', 'restored', 'vidigal', '38th', 'mustapha', 'hadji', '57th', 'reigning', 'porto', 'benfica', 'portuguese', 'pauli', 'fightback', 'tipped', 'candidates', 'relegation', 'produced', 'second-half', '4-4', 'bundesliga', 'schalke', 'raced', 'trulsen', 'two-goal', 'cushion', 'afterwards', 'springer', '64th', 'thanks', 'sabotzik', 'hansa', 'rostock', 'karsten', 'baeron', 'dazzling', 'build-up', 'in-form', 'harald', 'spoerl', 'salah', 'hissou', 'clocked', '38.08', '26:43.53', 'haile', 'gebreselassie', 'hengelo', 'summaries', 'min', '18,500', 'driller', 'sobotzik', 'thon', '34th', 'wilmots', '1-3', '19,775', 'nancy', 'germain', '15,000', 'masterkova', 'warner', 'svetlana', 'smashed', 'bettered', 'mile', 'zurich', '28.98', 'ate', 'swift', 'lap', 'shave', '0.36', '2:29.34', 'mozambique', 'mutola', 'stadium', 'pushed', 'finishing', '2:29.66', 'bonus', 'historic', 'capacity', 'dominated', 'middle-distance', 'races', 'three-year', 'maternity', 'richest', 'slashed', '3.05', '12.56', 'plus', 'kilo', '100,000', 'fortnight', 'laid', 'comparable', 'surface', 'softer', 'enjoyed', 'gear', 'strides', 'pointing', 'clock', 'delight', 'crossed', 'evolution', 'tabulated', '2:30.67', 'wachtel', 
'17.8.90', '25.8.95', '2:28.98', '23.8.96', '28.99', 'adjusted', '128', '129', '130', '131', '132', 'borrego', '133', 'willison', 'ames', 'trinidad', 'tobago', '134', 'coles', 'chapman', 'cea', '135', 'mason', 'barry', 'lane', 'webster', 'mitchell', 'upstages', 'trio', 'dennis', 'upstaged', 'present', 'storming', 'customary', 'bright', 'outfit', '10.03', 'scalp', 'donovan', 'bailey', 'linford', 'christie', '1988', 'lucrative', 'blocks', 'burst', 'celebration', '10.09', '10.10', 'bronze', 'medallist', 'ato', 'boldon', '10.12', '10.14', 'limp', 'hurdles', 'allen', 'defied', 'brilliant', '12.92', '0.01', 'colin', 'jackson', 'fastest', 'hurdler', 'seemed', 'relish', 'dominating', 'finish', 'faster', 'speed', '13.24', 'pelting', 'hurdlers', 'stepped', 'ludmila', 'engquist', 'crashed', 'hurdle', 'footing', '12.60', 'silver', 'brigita', 'bukovec', '12.95', 'jamaican', 'michelle', 'freeman', '12.77', 'cuban', 'aliuska', 'lopez', 'jackpot', 'one-kg', 'clinch', 'golden', 'penultimate', 'adkins', 'alive', '47.93', 'gail', 'devers', '10.84', '0.10', 'merlene', 'ottey', 'medal', 'photo', 'settle', '11.04', 'gwen', 'torrence', '11.00', 'costly', 'discus', 'ilke', 'wyludda', '66.60', 'ellina', '65.66', 'franka', 'dietzsch', '61.74', 'natalya', 'sadova', '61.64', 'mette', 'bergmann', '61.44', 'nicoleta', 'grasu', '61.36', 'olga', 'chernyavskaya', '60.46', 'irina', 'yatchenko', '58.92', 'jamaica', 'cuba', '12.85', 'dionne', '12.88', 'yulia', 'graudin', '12.96', 'julie', 'baumann', '13.36', 'girard-leno', 'dawn', 'bowles', '13.53', 'emilio', 'valle', '13.33', 'pieters', '13.37', '13.38', 'asselman', '13.64', 'hubert', 'grossard', '13.65', \"n'senga\", '13.66', 'johan', 'lisabeth', '13.75', 'roberta', 'brunet', '48.96', 'fernanda', 'ribeiro', '14:49.81', 'sally', 'barsosio', 'kenya', '14:58.29', 'paula', 'radcliffe', '14:59.70', 'julia', 'vaquero', '15:04.94', 'catherine', 'mckiernan', '15:07.57', 'annette', 'peters', '15:07.85', 'pauline', 'konga', '15:11.40', 'davidson', 'ezinwa', 
'nigeria', '10.15', 'jon', '10.16', 'bruny', 'surin', '10.30', 'samuel', 'matete', 'zambia', '47.99', 'rohan', '48.86', 'torrance', 'zellner', '49.06', 'jean-paul', 'bruwier', '49.24', 'dusan', 'kovacs', '49.31', 'calvin', '49.49', 'laurent', 'ottoz', '49.61', 'dollendorf', '50.36', 'onyali', '11.09', 'chryste', 'gaines', '11.18', 'zhanna', 'pintusevich', '11.27', 'privalova', '11.28', 'natalia', 'voronova', 'juliet', 'cuthbert', '11.31', 'regina', '01.77', 'djate', '4:02.26', 'carla', 'sacramento', '4:02.67', 'yekaterina', 'podkopayeva', '4:04.78', 'margret', 'crowley', '4:05.00', 'leah', 'pells', '4:05.64', 'sarah', 'thorsett', '4:06.80', 'sinead', 'delahunty', '4:07.27', 'steeplechase', 'joseph', 'keter', '10.02', 'sang', '8:12.04', 'moses', 'kiptanui', '8:12.65', 'gideon', 'chirchir', '8:15.69', 'kosgei', '8:16.80', 'larbi', 'khattabi', '8:17.29', 'eliud', 'barngetuny', '8:17.66', 'barmasai', '8:17.94', '44.29', 'mills', '44.78', 'anthuan', 'maybank', '44.92', 'kamoga', 'uganda', '44.96', 'baulch', '45.08', 'bada', '45.21', 'samson', 'kitur', '45.34', 'richardson', '45.67', 'rouser', '46.11', 'frankie', 'fredericks', 'namibia', '19.92', '19.99', '20.21', '20.42', 'stevens', '20.43', 'garcia', '20.45', 'eric', 'wymeersch', '20.84', 'lamont', '21.08', 'malgorzata', 'rydz', '2:39.00', 'anja', 'smolders', '2:43.06', 'veerle', 'jaeghere', '2:43.18', 'eleonora', 'berlanda', '2:43.44', 'anneke', 'matthijs', '2:43.82', 'jacqueline', '2:44.22', '22.42', 'inger', '22.66', '22.68', '22.73', 'trandenkova', '22.84', 'chandra', 'sturrup', '22.85', 'zundra', 'feagin', '23.18', 'galina', 'malchugina', '23.25', 'cathy', '49.48', 'marie-jose', 'perec', '49.72', 'falilat', 'ogunkoya', '49.97', '50.14', 'fatima', 'yussuf', 'maicel', 'malone', '50.51', 'hana', 'benesova', '51.71', 'ann', 'mercken', '53.55', 'komen', '25.87', 'khalid', 'boulami', '7:31.65', 'bob', '7:31.69', 'hassane', 'lahssini', '7:32.44', 'nyariki', '7:35.56', 'noureddine', 'morceli', '7:36.81', 'fita', 'bayesa', 
'7:38.09', 'keino', '7:38.88', 'lars', 'riedel', '66.74', '66.72', 'dubrovshchik', '64.02', 'virgilius', 'alekna', '63.62', 'juergen', 'schult', '63.48', 'vassiliy', 'kaptyukh', '61.80', 'vaclavas', 'kidikas', '60.92', 'mollenbeck', '59.24', 'triple', 'jump', 'edwards', '17.50', 'yoelvis', 'quesada', '17.29', 'wellman', 'bermuda', '17.05', 'harrison', '16.97', 'markov', '16.66', 'francis', 'agyepong', '16.63', 'rogel', 'nachum', '16.36', 'sigurd', 'njerve', '16.35', 'guerrouj', '29.05', 'isaac', 'viciosa', '3:33.00', 'tanui', '3:33.36', 'elijah', '3:33.64', \"o'sullivan\", '3:33.77', 'mayock', '3:33.94', 'laban', 'rotich', '3:34.12', 'impens', '3:34.13', 'stefka', 'kostadinova', '2.03', 'inga', 'babakova', 'alina', 'astafei', '1.97', 'motkova', '1.94', 'zalevskaya', 'kazakhstan', '1.91', 'yelena', 'gulyayeva', '1.88', 'hanna', 'haugland', 'boshova', '1.85', 'nele', 'zilinskiene', 'tergat', '26:54.41', 'koech', '26:56.78', 'kiptum', '27:18.84', 'aloys', 'nizigama', 'burundi', '27:25.13', 'mathias', 'ntawulikura', 'rwanda', '27:25.48', 'abel', 'anton', '28:18.44', 'kamiel', 'maase', '28.29.42', 'worku', 'bekila', '28.42.23', 'stefko', '28:42.26', '18-man', 'paulo', 'sousa', 'juventus', 'member', 'oliveira', 'coaches', 'vitor', 'baia', 'rui', 'correia', 'paulinho', 'santos', 'helder', 'cristovao', 'secretario', 'dimas', 'teixeira', 'couto', 'barroso', 'figo', 'barros', 'oceano', 'cruz', 'ricardo', 'pinto', 'forwards', 'domingos', 'joao', 'vieira', 'cadete', 'folha', 'vogts', 'keeps', 'faith', 'berti', 'entire', 'friendly', 'zabrze', 'nominated', 'veterans', 'jens', 'todt', 'dispensation', 'libero', 'matthias', 'sammer', 'steffen', 'freund', 'defender', 'rene', 'schneider', 'formally', \"'ll\", 'themselves', 'oliver', 'kahn', 'koepke', 'reck', 'markus', 'babbel', 'helmer', 'kohler', 'mario', 'basler', 'bode', 'dieter', 'eilts', 'haessler', 'moeller', 'mehmet', 'scholl', 'strunz', 'ziege', 'bierhoff', 'fredi', 'bobic', 'klinsmann', 'kuntz', 'draws', 'olympiakos', 'pao', 
'x-aek', 'x-olympiakos', 'x-pao', 'legia', 'warsaw', 'x', 'indicates', 'competitions', 'lyngby', 'x-club', 'brugge', 'casino', 'graz', 'ekeren', 'besiktas', 'molenbeek', 'alania', 'vladikavkaz', 'x-anderlecht', 'x-cercle', 'healed', 'lankans', 'acrimonious', 'guilty', 'tampering', 'off-spinner', 'muttiah', 'muralitharan', 'throwing', 'controversial', 'three-test', 'proper', 'arjuna', 'ranatunga', 'eve', 'warmup', 'xi', 'cam', 'battersby', 'excellent', 'batterby', 'lankan', 'wicketkeeper', 'healy', 'angola', 'luanda', 'angolan', 'jornal', 'proposing', 'definite', 'unita', 'generals', 'formation', 'unity', 'reconciliation', 'circulation', 'peoples', 'guaranteed', 'installed', 'deputies', 'occupy', 'delays', 'occupation', 'demilitarised', 'substituted', 'so-called', 'dos', 'proposes', 'definitive', 'timetable', 'tasks', 'obligations', 'lusaka', 'sending', 'supervise', 'execution', 's.african', 'consensus', 'day--company----period--consensus----range-------pvs', 'mon', 'gencor', '93.12', '92.0-94.5', '73.8', '25.75', '25.0-27.0', '20.0', 'primedia', 'n', '149.1', '123.2', 'distillers', '71.8', '49.0', 'tue', 'iscor', '29.7', '26.0-32.0', '38.0', '15.0', '14.5-16.5', '16.5', 'mccarthy', '125.3', '112.0-149.0', '93.2', '36.8', '32.0-43.0', '28.0', 'wed', 'imphold', '172.7', '170.4-175.0', '115.1', '67.5', '66.6-68.4', '45.0', 'thu', 'm&r', '113.0', '112.1-113.4', '126.0', '31.7', '10.5-42.3', '47.0', 'jd', '143.7', '138.0-149.0', '111.2', '41.8', '41.0-42.5', '33.0', 'oooooo', '+27', '482', '1003', 'ulster', 'petroleums', 'falls', 'calgary', 'shr', '0.04', '0.08', '1,196', '2,232', '0.39', '0.41', 'revs', '20,167', '18,623', '0.12', '0.15', '3,674', '4,271', '0.86', '0.81', '41,752', '35,711', '000s', '416', '941-8100', 'jeopardize', 'trip-canada', 'ottawa', 'restrictions', 'axworthy', 'circumstances', 'discuss', 'mid-tier', 'golds', 'fever', 'handful', 'toronto-based', 'tvx', '0.30', '11.55', '780,000', 'kinross', '0.25', '720,000', 'scorpion', 'minerals', 'junior', 
'exploration', 'properties', '0.50', '120,000', 'changing', 'hands', 'eyebrows', 'aware', 'developments', 'formed', 'unitog', 'upgraded', 'barrington', 'associates', 'near-term', 'buffett', 'stake', 'omaha', 'billionaire', 'warren', 'trust', '8.0', '6.7', 'filing', 'securities', 'exchnage', '62,900', 'boston-based', 'estate', 'ranging', '7.65', 'holding', '725,900', 'purchased', '6.2', 'well-known', 'investor', 'berkshire', 'hathaway', 'holds', 'investments', 'large', 'reach', 'miami', 'allow', 'amr', 'airlines', 'operate', 'round-trip', 'transportation', 'shift', 'designate', 'all-cargo', 'permitted', 'category', 'conditional', 'routes', '2-1/2', 'resolved', 'arose', 'colombians', 'propose', 'avianca', 'clean', 'tanker', 'fixtures', 'enquiries', '1754', 'mideast', 'konpolis', '1/9', 'w112.5', 'kpc', 'tbn', '6/9', 'w.c.', 'w200', 'e.c.india', 'w195', 'ioc', 'asia', 'petrobulk', 'rainbow', '24/8', 'okinawa', 'inchon', '190,000', 'honam', 'med', '15/9', 'constanza', 'inia', '700,000', 'cont', '36,5', '3/9', 'pembroke', 'w145', 'stentex', 'hemisphere', 'kpaitan', 'stankov', '31/8', 'croix', 'usac', 'w125', 'hess', 'ap', 'moller', 'caribs', '875,000', 'tiber', '2/9', 'options', 'w265', 'stinnes', '------------------------------------------------------------', 'tenacity', '24/08', 'samsung', 'sks', 'tana', '03/09', 'cnr', 'northsea', 'chaser', '12/09', 'w167.5', 'jomo', 'sibonina', '13/09', 'w160', 'marubeni', 'neptune', 'crux', '02/09', 'singapore', '185,000', 'sietco', 'rnr', 'fulmar', '28/08', 'yosu', '105,000', 'lg', 'caltex', 'hemina', '05/09', 'eleusis', 'ukcm', 'w155', '8980', '229-1', 'sacks', 'golfer', 'sacked', 'harmon', 'ways', 'long-time', 'mentor', 'drawing', 'blank', 'tournaments', 'blonde', 'adrift', 'tanaki', 'worst', 'circuit', 'application', 'strange', 'keyed', 'your', 'perform', 'ori', 'taibe', 'fields', 'arabs', '1961', 'loyal', '28,000', 'unfriendly', 'crowds', 'taunt', 'thing', 'promoted', 'betar', 'supporter', 'karem', 'haj', 'yihye', 'coached', 
'wojtek', 'lazarek', 'closely', 'chants', 'bottle-throwing', 'marred', 'goalless', 'treatment', 'stone', 'driving', 'hearing', 'taunts', 'sameh', 'resident', 'hebrew', 'words', 'nobody', 'vehemently', 'dusty', 'lacks', 'amenities', 'communities', 'discrimination', 'parks', 'empty', 'load', 'tel', 'aviv', 'ramshackle', '2,500-seat', 'accessible', 'dirt', 'tracks', '10,000-seat', 'situated', 'elsewhere', 'rahman', 'mayor', 'hopefully', 'refurbished', 'meantime', 'policed', 'coastal', 'netanya', 'israelis', 'waiter', 'represents', 'phelan', 'withdrawn', 'liechenstein', 'f.a.i.', 'liverpool', 'replacements', 'damien', 'lynch', '+353', '6603377', 'pitted', 'hopefuls', 'runners-up', 'rapid', 'fenerbahce', 'turin', 'trafford', '1990s', 'consistently', 'crashing', 'barcelona', 'trophy', 'triumph', '1968', 'wembley', 'conquering', 'ill-fated', '1985', 'heysel', 'robbery', 'suspects', 'lagos', 'sokoto', 'nan', 'umar', 'stealing', '800,000', 'naira', 'merchant', 'rwandan', 'expulsion', 'imminent', 'nairobi', 'repatriation', '1.1', 'hutu', 'zaire', 'lobby', 'innocent', 'butare', 'democracy', 'rdr', 'hutus', 'appealed', 'deter', 'termed', 'inhuman', 'orthodox', 'blown', 'zagreb', 'saboteurs', 'serb', 'damaged', 'hina', 'karin', 'gornji', 'zadar', 'destroyed', 'casualties', 'find', 'perpetrators', 'hinterland', 'serbs', 'yugoslav', 'self-styled', 'krajina', 'proclaimed', 'minority', 'recaptured', '200,000', 'vacant', 'depopulated', '27.53', '27.25', '27,535.5', 'reserves', '13,256.5', '12,855.7', '14,278.9', '9,510.9', '10,056.4', 'tighten', 'crime', 'organised', 'pap', 'zbigniew', 'siemiatkowski', 'schmidbauer', 'co-ordinator', 'helmut', 'kohl', 'chancellery', 'sealed', 'links', 'ryszard', 'hincza', 'mafia-style', 'smuggling', 'radioactive', 'materials', 'chechens', 'observing', 'fighters', 'soldiers', 'effective', 'gunfire', 'echoed', 'withdraw', 'rebel-dominated', 'mountains', 'relatively', 'shabazov', 'bearded', 'wearing', 't-shirt', 'camoflage', 'trousers', 'rocked', 
'courtyard', 't-72', 'tank', 'roared', 'swept', 'checkpoints', 'roads', 'soldier', 'goncharova', 'dark', 'hair', 'poking', 'peaked', 'camouflage', 'overhead', 'flares', 'patrols', 'sceptical', 'try', 'cis', 'closures', 'independent', 'granic', 'croatia-yugoslavia', 'poised', 'landmark', 'normalisation', 'paving', 'stabilisation', 'balkans', 'mate', 'aboard', 'jet', 'counterparts', '1000', 'endorsed', 'normalising', 'tanjug', 'assessed', 'crucial', 'resolving', 'ensuring', 'restoration', 'last-minute', 'print', 'internationally', 'recognised', 'borders', 'diplomats', 'secession', 'powers', 'regard', 'twin', 'pillars', 'multinational', 'lasting', 'quito', 'abdala', 'bucaram', 'lunches', 'presidential', 'different', 'blacks', 'mixed-bloods', 'exclusively', 'potentates', 'ambassadors', 'protocol', 'mixed-race', 'peasant', 'sectors', 'elected', 'populist', 'platform', 'cultures', 'andean', 'nation', 'indigenous', 'hovercrafts', 'amazon', 'brasilia', 'plying', 'waters', 'bid', 'difficulties', 'vast', 'waterway', 'russian-built', 'capable', 'tons', 'ferrying', 'huge', 'river', 'belem', 'riverways', 'high-speed', 'hovercraft', 'hk', 'tsang', 'donald', 'suharto', \"mar'ie\", 'muhammad', 'ali', 'alatas', 'tungky', 'ariwibowo', 'bolger', 'don', 'mckinnon', 'birch', 'expels', 'bread', 'riots', 'rana', 'sabbagh', 'passed', 'peacefully', 'demonstrations', 'adel', 'ibrahim', 'attache', 'duties', 'incompatible', 'norms', 'implying', 'spying', 'notified', 'explusion', 'assistant', 'khalaf', 'expelled', 'king', 'defections', 'retaliated', 'expelling', 'jordanian', 'secure', 'pro-baghdad', 'karak', 'flared', 'hundred', 'lingered', 'omari', 'mosque', 'shouting', 'disperse', 'abstain', 'forming', 'enforced', 'loose', 'curfew', 'loudspeakers', 'allahu', 'akbar', 'islamist', 'kafawin', 'pulpit', 'detainees', 'houses', 'cancelling', 'armoured', 'streets', 'traditional', 'bastion', 'communist', 'ideology', 'baath', 'socialism', '1950s', 'guarded', 'entrances', 'hill-top', 'famed', 
'crusader', 'castle', 'crowded', 'smaller', 'quietly', 'riot', '80-seat', 'involvement', 'policies', 'hardship', 'rioting', 'derision', 'blame', 'protests', 'hardships', 'kurd', 'ankara', 'anatolian', 'state-paid', 'pkk', 'sirnak', 'hakkari', '12-year-old', 'autonomy', 'southeastern', 'planted', 'exploded', 'fights', 'diyarbakir', 'u.s.-mediated', 'glyn', 'davies', 'contacts', 'barzani', 'jalal', 'talabani', 'implementation', 'pelletreau', 'solidify', 'cease-fire', 'pursue', 'repelled', 'wounding', 'capturing', 'opposing', 'unite', 'mountainous', 'slumber', 'chesapeake', 'knife-wielding', 'neighbour', 'apparently', 'intent', 'sexual', 'invaded', 'teenage', 'a.m.', 'edt', 'teenaged', 'girls', 'camelot', 'subdivision', 'virginia', 'entered', 'wielding', 'knife', 'sexually', 'detective', 'curtis', 'ii', 'adults', 'sketchy', 'teenagers', 'reportedly', 'downstairs', 'watching', 'allegedly', 'teenager', 'sleeping', 'upstairs', 'commotion', 'confronted', 'stabbed', 'once', 'assailant', 'fatally', 'molested', 'life-threatening', 'identified', 'harper', 'glickman', 'usda', 'monitoring', 'aflatoxin', 'dan', 'corn', 'usda-sponsored', 'perennial', 'problematic', 'vomitoxin', 'purchase', 'wheat', 'republican', 'weld', 'senate', 'franny', 'incumbent', 'sen', 'kerry', 'vote', 'wbur-fm', 'facing', 'cambridge', 'friend', 'tracy', 'roosevelt', 'politics', 'great-granddaughter', 'franklin', 'roosevelts', 'friends', 'susan', 'descendant', 'theodore', 'lufthansa', '1.7', 'in-house', 'lufthanseat', 'freight-tonne', 'kilometres', '2,389', '1,600', 'freight', '67.0', 'transport', 'dm', '820', 'flight-related', '125', 'wsc-india', 'summary-', 'showers', '0.25-1.30', 'inch', '6-33', 'mm', 'locally', 'coverage', 'isolated', '0.20-0.70', '5-18', '82-96f', '28-36c', 'crop', 'impact-', 'forecast-', '0.25-1.00', '6-25', '0.75', 'tonight', 'variable', 'clouds', 'cloudy', '68-76f', '20-24c', 'thunderstorms', 'temperatures', 'corporation', 'curb', 'tamil', 'stamp', 'soil', 'directed', 
'sympathised', 'predicament', 'prevailing', 'framework', 'perpetrate', 'coordinator', 'counter', 'terrorism', 'wilcox', '13-year', 'extorted', 'expatriate', 'liberation', 'eelam', 'leaves', 'week-long', 'kathmandu', 'birendra', 'ascending', 'throne', '1972', 'constitutional', 'monarch', 'jiang', 'zemin', 'peng', 'prakash', 'lohani', 'himalayan', 'sandwiched', 'traditionally', 'giant', 'neighbours', 'distance', '50-year', 'queen', 'aishwarya', 'tibetan', 'lhasa', 'chongqing', 'servant', 'nepali', 'bound', 'employer', 'madhusudan', 'munakarmi', 'informed', 'plight', '12-year', 'dhiraj', 'k.c.', 'locks', 'concealed', 'dheeraj', 'employed', 'limping', 'steal', 'belongings', 'vols', 'regrouping', 'implied', 'volatility', 'stabilise', 'falling', 'german-led', 'euromark', 'trader', '14.00', '16.75', '19.50', '21.25', 'welter', '18.50', '20.00', '22.00', '23.5', '1347', '96.78', 'sell-off', 'overdone', 'floors', 'size', 'bundesbank', 'repo', '3.00', '3.30', 'longer-dated', 'short-dated', 'vol', 'historically', 'vol.', 'reassess', 'otc', 'specialist', 'coughlan', 'over-the-counter', '10-year', 'bunds', 'makers', 'high-yielding', 'downside', 'upside', 'potential', 'recommend', 'strangles', 'particular', 'vulnerable', 'fronts', 'enhance', 'yield', 'nisbet', 'bonds', '6320', 'sachs', 'warrants', 'continental', 'wertpapier', 'american-style', 'warrant', 'controls', '25.00', 'dem', 'premium', '2.42', 'gearing', '10.29', '02.sep.96-21.nov.97', 'paydate', '30.aug.96', 'ddf', 'fft', 'stg', 'exer', '24.90', 'challenge', 'diana', 'photographer', 'branded', 'stalker', 'princess', 'approaching', 'stenning', '12-week', 'contest', 'injunction', 'obtained', 'affidavit', 'affadavit', 'benedict', 'birnberg', 'everything', 'ice', 'brick', 'driver', 'motorcycle', 'dispatch', 'rider', 'convictions', 'magistrates', 'compensation', '182', '282', 'freelance', 'divorce', 'heir-to-the-throne', 'prince', 'charles', 'persistently', 'trailing', 'chasing', 'remove', 'camera', 'scapegoat', 
'photographers', 'mr.', 'shook', 'dohuk', 'tentative', '...for', 'sake', 'asking', 'riza', 'altun', 'accompany', 'frequent', 'cross-border', 'drives', 'writer', 'nacar', 'wider', 'effort', 'necmettin', 'erbakan', 'encouraged', 'uses', 'solidere', 'privately-operated', 'secondary', 'bsm', 'distributed', 'rebuilding', '104.625', '650-million', 'subscription', '106.5', '106.375', '8,049', '8,757', '850,968', '918,288', '1,185', 'ciments', 'libanais', '1.1875', '2,036', 'listed', 'blancs', 'eternit', 'uniceramic', 'blom', 'covers', '903.09', 'lispi', '0.02', '81.58', 'editorial', '961', '864148', '353078', '861723', 'zenith', 'lands', 'plant', 'nadeau', 'consortium', 'walt', 'disney', 'digital', 'televison', 'set-top', 'boxes', 'entertainment', 'struggled', 'luehrs', 'glenview', 'ill.-based', 'networks', 'anytime', 'somebody', 'gets', 'soared', '5.50', '16.875', 'americast', 'develop', 'generation', 'addition', 'partners', 'phone', 'ameritech', 'corp.', 'bellsouth', 'gte', 'sbc', 'communications', 'telecommunications', 'join', 'cable', 'woodridge', 'ill', 'tubes', '32-', '35-inch', 'screen', 'buys', 'competitors', 'jobs', 'roll', 'build-to-order', 'convert', 'chihuahua', 'analogue', 'manufacture', 'profitable', 'subscribers', 'technology', 'retail', 'electronics', 'devices', 'dividends', 'plagued', 'colour', 'reporting', 'full-year', '33.2', '45.3', '97', 'korea-based', 'gutenstein', 'kalf', 'voorhis', 'unique', 'happy', 'natural', 'meditate', 'hundreds', 'yogic', 'fliers', 'defy', 'nature', 'levitating', 'comes', 'minor', 'candidate', 'transcendental', 'meditation', 'tm', 'physicist', 'hagelin', 'nov.', 'running', 'claiming', 'ward', 'techniques', 'stress', 'automatically', 'decrease', 'practitioners', 'involves', 'meditating', 'repeated', 'word', 'phrase', 'mantra', 'followers', 'contend', 'mediate', 'demonstration', 'bouncing', 'sitting', 'windows', 'fail', 'wolk', 'massively', 'publicized', 'introduction', 'microsoft', 'computer', 'fallen', 'fastest-selling', 
'unprecedented', 'hype', 'aug.', 'launch', 'greet', 'lines', 'customers', 'redmond', 'wash.-based', 'tens', 'dollars', 'promoting', 'stunts', 'lighting', 'building', 'color', 'scheme', 'rob', 'enderle', 'giga', 'hardware', 'spike', 'materialized', 'expecting', 'coat-tails', 'somewhat', 'winkler', 'gartner', 'impact', 'earth-shattering', 'symantec', 'posting', 'projections', 'touchstone', '1.3', 'lawsuit', 'tied', 'developers', 'suffer', 'shelves', 'jammed', 'blue-and-white', 'resulting', 'shortage', 'space', 'seasonal', 'stephens', 'pc', 'accompanying', 'upgrade', '8.67', 'cemented', 'dominant', 'executives', 'thrilled', 'sometime', 'surpass', 'older', 'computers', 'handling', 'technical', 'frustrated', 'install', 'corporate', 'adopted', 'go-slow', 'high-end', 'nt', 'downplayed', '4.0', 'proportion', 'users', 'mistake', 'thinking', 'sweeping', 'slow', 'migration', 'pacts', 'repatriate', 'intercepted', 'migrants', 'illegally', 'jeopardising', 'cubans', 'guantanamo', 'naval', 'enforcement', 'alien', 'hijackings', 'remind', 'everyone', 'abiding', 'avoiding', 'havana', 'centred', 'boatload', 'emigrants', 'capsized', 'sixteen', 'bay', 'emigrated', 'hijacking', 'hijackers', 'hijacked', 'commercial', 'aylum', 'wis', 'apply', 'welfare', 'pioneering', 'image', 'wisconsin', 'submit', 'administrative', 'tommy', 'submitted', 'reform', 'curve', 'dubbed', 'w-2', 'waivers', 'acquire', '60-day', 'residency', 'requirement', 'participation', 'collections', 'directly', 'custodial', 'eligibility', 'karen', 'pierog', '312-408-8647', 'snoozing', 'vietnamese', 'train', 'alaska', 'anchorage', 'snooze', 'boxcar', 'locked', 'whittier', 'tuan', 'quac', 'phan', 'dehydrated', 'famished', 'terrified', 'barge', 'sgt', 'jewell', 'cooperative', 'uniform', 'accidental', 'searching', 'fishing', 'sleep', 'coupled', 'transporting', 'lumber', 'sound', 'fed', 'soup', 'breakfast', 'agents', 'arkansas', 'fires', 'barnes', 'rock', 'ark', 'sifted', 'rubble', 'predominantly', 'churches', 'burned', 
'mississippi', 'delta', 'kms', 'located', 'investigating', 'idea', 'arson', 'conclusively', 'established', 'f.b.i.', 'alcohol', 'firearms', 'scene', 'zion', 'baptist', 'st.', 'matthews', 'frame', 'structures', 'turner', 'surrounded', 'cotton', 'soybean', 'rural', 'surprised', 'fannie', 'matthew', 'connected', 'shared', 'suspicion', 'motive', 'spite', 'rev.', 'jerome', 'pastor', 'spared', 'wave', 'worship', 'camden', 'oak', 'initiated', 'everen', '0.13', '0.40', '0.43', 'simulated', 'models', 'discount', 'averages', 'short-term', 'objective', '1/16', '3-11/16', 'sungard', 'checkfree', 'mateo', 'calif.', 'shareholder', 'finalized', 'o', '212', '859-1610', 'alpha', 'techs', 'lockhart', 'technologies', '280,556', 'post-closing', 'adjustments', 'designer', 'sophisticated', 'thermal', 'ptt', 'telecoms', 'koninklijke', 'nederland', 'nv', 'marginally', 'scant', 'adjust', '1.209', 'breadth', '1.210-1.236', '1.210', 'largely', 'view', 'overwhelmingly', 'surprising', 'ing', 'steven', 'vrolijk', 'continuing', 'performer', 'sticking', '2.45', 'guilder', '2.26', '1403', '1.70', '61.00', 'weaker', 'bourse', 'keiron', 'henderson', 'boskalis', 'upgrades', '13:12', 'papendrecht', 'dredging', 'westminster', 'utilisation', 'dredger', 'uncertain', '70.9', 'prospects', 'first-half', '27.5', '41.4', 'dissolves', 'costis', 'stephnopoulos', 'ordering', 'dissolution', '300-seat', 'stephanopoulos', 'poll', 'citing', 'convergence', 'originally', 'libyan', 'amer', 'hishem', 'mohammed', 'pool', 'sliema', 'stab', 'wounds', 'grech', 'fervant', 'investigations', 'bahn', 'h1', 'pre-tax', '17.5', '188', '14,600', '3.3', 'state-owned', 'earmarked', 'eventual', 'privatisatio', 'fat8222', 'long-distance', 'traffic', '2,500', '6.4', 'commuter', '5,400', '4.6', '3,200', '5.1', 'workforce', '300,962', '3.7', 'oct', 'compare', 'compares', '+49', '756525', 'lion', 'paparazzi', 'tabs', 'whales', 'marine', 'biologists', 'lions', 'tag', 'photograph', 'elusive', 'depths', 'scientist', 'harvey', 'jennifer', 
'hurley', 'moss', 'laboratories', 'companions', 'species', 'whale', 'diver', 'knows', '17-year-old', 'beaver', 'nine-year-old', 'undergone', 'amusement', 'accurately', 'transmitter', 'swim', 'mammals', 'filming', 'video', 'assignment', 'documenting', 'humpback', 'monterey', 'article', 'spell', 'exactly', 'taught', 'stick', 'plastic', 'model', 'using', 'suction', 'cups', 'jeopardises', 'howard', 'jeopardised', 'upper', 'scrutinise', 'hacks', 'hack', 'environment', 'function', 'warned', 'fiscally-tight', 'hampered', 'contained', 'sharp', 'spending', '5.6', 'partially', 'telstra', 'greens', 'labor', 'toyota', 'melbourne', '2,000', 'striking', 'voted', 'two-week', 'stoppage', 'niugini', 'surge', 'miner', 'surged', '38', '3.75', 'confirmation', 'mountain', 'considering', 'acquiring', '49.6', 'minorities', 'broker', 'copper', 'papua', '17.2', 'lihir', 'project', '0025', '3.65', '108,288', '9373', 'students', 'throw', 'irreplaceable', 'rocks', 'yonsei', 'samples', 'geology', 'collect', 'prefessors', 'collection', 'gathered', 'panes', 'desks', 'forever', 'professor', 'staged', 'violent', 'nine-day', 'unification', 'campus', 'unwinding', 'unwound', 'belief', 'strengthen', '818.10', '819.10', '817.60', '819.30', 'overbought', 'insistent', 'intervention', 'convinced', 'supporting', 'orii', '96/97', '8.70', 'prft', '371', 'nil', '447', '48.61', 'automation', '95/96', '9.33', '286', '48', '350', '38.11', 'diluted', 'lynne', \"o'donnell\", 'shanghai', 'bonded', 'warehouses', 'confounding', 'fate', 'belongs', 'yingkou', 'stockpile', 'stored', 'guessing', 'metal', 'channelled', 'nonferrous', 'metals', 'cniec', 'indication', 'administered', 'value-added', 'prohibitively', 'otherwise', 'spend', 'moving', 'mystery', 'unsure', 'exact', 'cost-effective', 'depleted', 'purpose', 'backwardation', 'lme', 'occurs', 'lent', '85,000', 'behalf', '115,000', '2,700', 'tonne', 'somewhere', '2,200', 'storage', 'secret', 'unnerved', 'jittery', 'bloomsbury', 'economics', 'bme', 'motivation', 
'owners', 'fundamental', 'rumours', 'sumitomo', 'helping', 'unload', '1.8', 'decade', 'arrangement', 'unaware', 'arrivals', 'irrelevant', 'commodities', 'desire', '2843-6470', 'companion', 'marble', 'posts', 'h.k.', '14.0', 'exceptional', '56.06', '531.52', 'holdings', 'payable', 'granite', 'distributor', 'spinoff', 'construction', '2843', '6368', 'softbank', 'procure', 'forex', 'acquisition', 'kingston', 'transactions', 'maker', 'memory', 'boards', 'acquisitions', 'telecomm', 'half-year', 'yuan', '115.259', '123.157', '20.318', '22.828', 'asset', '3.02', 'comparative', '0.14', 'unaudited', 'promodes', 'decide', 'spar', 'les', 'echos', 'rothschild', 'cie', 'intermediary', 'unlisted', 'retailers', 'metro', 'rewe', 'lidl', 'discussions', 'promo', 'hypermarket', 'continent', 'superstores', 'generated', '4.7', 'outline', 'specia', 'dia', 'aldi', '4221', '5452', 'highlights', 'lender', 'permanent', 'stalemate', 'claim', 'owed', 'taylor', 'trawler', 'corps', 'cat', 'mouse', 'enterprise', 'employment', 'widened', 'managers', 'ivernia', 'minorco', 'zinc', 'lisheen', 'tipperary', 'crh', 'refused', 'stering', 'tilcon', 'societies', 'antrim', 'protestant', 'driven', 'loyalist', 'paramilitaries', 'yesterday', 'defiance', 'hanging', 'dunnes', 'bankers', 'merrill', 'transferring', 'plastics', 'incineration', 'suitable', 'recycling', 'jv', '1996-08-24', 'truck', 'post-tax', 'jiangling', '3.385', '14.956', '937.891', '1.215', '0.005', '8,333', '9,018', 'vehicle', 'engine', '138.643', '353.24', 'jiangxi', '8.3', 'semifinals', 'rallying', 'kankkunen', 'mcrae', 'rolls', 'jyvaskyla', 'juha', 'impressive', '37', 'stages', 'lakes', 'overshadowed', 'kankunnen', 'prospect', 'gronholm', 'tommi', 'makinen', 'mitsubishi', 'fined', '250,000', 'sports', 'governing', 'rolled', 'subaru', '6.5', 'co-driver', 'ringer', 'unhurt', 'boss', 'richards', 'furious', 'astonishing', 'pace', '!', '37-year-old', 'spaniard', 'sainz', 'turbo', 'bruno', 'thiry', 'transmission', 'shaft', 'grid', '50.574', 
'226.859', 'kph', '1:50.980', 'ferrari', '1:51.778', '1:51.884', '1:51.960', '1:52.318', '1:52.354', '1:52.977', 'eddie', 'irvine', '1:53.043', '1:53.152', '1:53.199', '1:53.993', 'salo', 'tyrrell', '1:54.095', '14.', '1:54.220', 'diniz', '1:54.700', 'jos', 'verstappen', 'arrows', '1:55.150', '17.', 'ukyo', 'katayama', '1:55.371', '1:56.286', 'lamy', 'minardi', '1:56.830', 'qualify', 'giovanni', 'lavaggi', '1:58.579', 'spectator', 'unnamed', 'danish', 'richardt', 'ploughed', 'two-kilometre', 'host', 'skidded', 'cordoned-off', 'suspended', 'resumed', 'practising', 'quarterfinals', 'suspension', '43-man', 'interrupted', 'schedeled', '+1', '+2', '+3', '+5', 'sigeki', '+7', '+8', '+9', '+11', 'bradford', 'wigan', '78', 'workington', '902', 'helens', '884', '441', '767', '409', 'warrington', '555', '499', '462', 'sheffield', '574', '696', 'halifax', '603', '552', 'castleford', '548', '543', 'oldham', '439', '656', 'leeds', '531', '681', '398', '795', '325', '1021', 'new-ball', 'neil', 'ilott', 'deliveries', 'left-armer', '252', 'slumped', 'derbyshire', 'favour', 'thrust', 'dispatching', 'removed', 'dominic', 'hewson', 'hancock', 'visitors', 'optimistically', 'graham', '532', 'declaring', 'prichard', 'plundered', '88', 'second-placed', 'prevented', '255', 'third-placed', 'uphill', 'notts', '446', 'alistair', '55-ball', 'half-century', 'rain-curtailed', 'fourth-placed', 'ropes', 'intervened', '2-24', 'gordon', 'parsons', '3-20', '2-19', '353', 'rekindled', 'successive', 'defeats', 'arch-rivals', '529', 'follow', '206', '323', 'paceman', 'darren', 'gough', 'polishing', '210', '176', 'b-4', 'lb-3', 'nb-11', '339', '2-239', '3-334', '4-334', '12-1-76-0', '22-6-56-2', '29-6-64-1', '14.3-4-45-1', '17-0-91-0', 'abandoned', '27-4', '532-8', '111', 'irani', 'alleyne', '4-80', 'renshaw', '4-56', 'bovill', '4-102', '81-7', 'ambrose', '6-26', '361', '117', 'ripley', '42-3', '446-9', 'b.', '4-104', '128-4', '205-9', 'spiring', 'watkinson', '4-53', '210-5', 'speak', 'hibernian', 
'dunfermline', 'kilmarnock', 'raith', 'motherwell', 'dundee', 'aberdeen', 'airdrieonians', 'fife', 'clydebank', 'greenock', 'morton', 'falkirk', 'partick', 'mirren', 'johnstone', 'berwick', 'stenhousemuir', 'brechin', 'ayr', 'hamilton', 'clyde', 'dumbarton', 'stranraer', 'livingston', 'alloa', 'arbroath', 'cowdenbeath', 'monstrose', 'forfar', 'inverness', 'ross', 'out-of-sorts', 'newcastle', 'teething', 'pacesetters', 'alan', 'shearer', 'keegan', 'talent-laden', 'dejan', 'stefanovic', 'faustino', 'asprilla', 'equalised', 'pembridge', 'glancing', 'header', 'whittingham', 'misery', 'ferdinand', 'stretchered', 'newly-promoted', 'sunderland', 'tottenham', 'hotspur', 'goaless', 'leboeuf', 'gianluca', 'vialli', 'coventry', 'managerless', 'arsenal', 'scoreline', 'aston', 'villa', 'derby', 'ham', 'southampton', 'bolton', 'norwich', 'bromwich', 'crystal', 'ipswich', 'southend', 'birmingham', 'stoke', 'swindon', 'vale', 'wolverhampton', 'barnsley', 'huddersfield', 'brentford', 'luton', 'bristol', 'blackpool', 'kickoff', 'burnley', 'walsall', 'chesterfield', 'bury', 'peterborough', 'crewe', 'preston', 'rovers', 'rotherham', 'shrewsbury', 'stockport', 'watford', 'millwall', 'wrexham', 'wycombe', 'gillingham', 'bournemouth', 'barnet', 'brighton', 'carlisle', 'hull', 'chester', 'darlington', 'swansea', 'exeter', 'scarborough', 'hartlepool', 'fulham', 'hereford', 'doncaster', 'leyton', 'orient', 'mansfield', 'rochdale', 'scunthorpe', 'torquay', '318-2', '318', '0-6', '33-26', 'unbeatable', 'tries', 'springboks', 'enemies', 'wilson', '24-11', 'flanker', 'ruben', 'kruger', 'scrum-half', 'joost', 'westhuizen', 'narrowed', 'gap', '23-24', 'fly-half', 'joel', 'stransky', 'conversion', 'upright', 'scrambled', 'replacement', 'zinzan', 'brooke', '21-11', 'hannes', 'strydom', 'stranksy', 'simon', 'culhane', 'conversions', 'cukaricki', 'hajduk', 'becej', 'borac', 'mladost', 'zemun', 'rad', 'buducnost', 'partizan', 'vojvodina', 'proleter', 'sutjeska', 'sloboda', 'loznica', 'obilic', 'ofk', 
'kikinda', 'radnicki', 'spartak', 'beograd', 'bj', 'zeleznik', 'rudar', 'amica', 'wronki', 'hutnik', 'krakow', 'sokol', 'tychy', 'lech', 'poznan', 'rakow', 'czestochowa', 'stomil', 'olsztyn', 'wisla', 'gornik', 'slask', 'wroclaw', 'odra', 'wodzislaw', 'gks', 'katowice', 'polonia', 'zaglebie', 'lubin', 'lks', 'lodz', 'belchatow', 'basketball', 'philippine', 'pro-league', 'manila', 'semi-final', 'milk', 'purefoods', 'hotdogs', '103-95', '34-48', 'half-time', 'ginebra', 'shell', '120-103', '65-56', 'pro-baseball', 'hyundai', 'haitai', 'hanwha', 'ob', 'lotte', 'ssangbangwool', '.606', '.533', '.471', '.455', '.443', '.407', '.359', '.594', '.473', '.446', '.574', '.520', '.630', '.411', '.527', '.430', '.538', '.429', 'gm', 'belenenses', 'boavista', 'slump', 'heerenveen', 'faltered', 'dismal', 'pre-season', 'deadlock', 'interval', 'romeo', 'wouden', 'veldman', 'curled', 'goalkeeper', 'edwin', 'sar', 'marcio', 'winston', 'bogarde', 'jari', 'litmanen', 'overmars', 'equalise', 'gaps', 'dahl', 'tomasson', 'rushed', 'lobbed', 'contenders', 'curtain-raiser', 'groningen', 'liege', 'anderlecht', 'lokeren', 'cercle', 'mouscron', 'antwerp', 'lommel', 'ghent', 'aalst', 'lierse', 'charleroi', 'sint', 'truiden', 'goalscorers', 'anto', 'drobnjak', 'bastia', 'xavier', 'gravelaine', 'marseille', 'miladin', 'becanovic', 'lille', 'enzo', 'scifo', 'monaco', 'smicer', 'lens', 'christopher', 'wreh', 'guingamp', 'nantes', '52nd', '16,000', 'nice', 'debbah', '39th', '6,000', 'boutoille', '79th', 'pen', 'rennes', \"guivarc'h\", 'bordeaux', 'auxerre', 'metz', 'traore', '65th', 'bombarda', '69th', 'strasbourg', 'zitelli', 'havre', 'caen', 'bancarel', '70th', 'lyon', 'caveglia', '89th', '7,000', 'montpellier', 'cannes', 'charvet', '8th', 'saint-germain', 'graafschap', 'doetinchem', 'rkc', 'waalwijk', 'willem', 'tilburg', 'fortuna', 'sittard', 'rotterdam', 'twente', 'enschede', 'vitesse', 'arnhem', 'utrecht', 'feyenoord', 'roda', 'jc', 'kerkrade', 'volendam', 'az', 'alkmaar', 'bochum', '66th', 
'arminia', 'bielefeld', 'molata', 'moenchengladbach', 'karlsruhe', '33rd', '45th', 'keller', 'balakow', '61st', 'werder', 'votava', '68th', '32,000', '1860', 'schwabl', 'zorc', '59th-pen', '73rd', 'heinrich', 'bayer', 'leverkusen', 'duesseldorf', 'seeliger', 'freiburg', 'zeyer', 'gaissmayer', '9th', 'polster', '22,500', 'vfb', 'vfl', 'bayern', 'msv', 'duisburg', 'fc', 'linz', 'gak', 'admira', 'wacker', 'sturm', 'linzer', 'ask', 'tirol', 'innsbruck', 'sv', 'salzburg', 'wien', 'ried', 'brings', 'one-day', '102-0', 'waugh', 'tendulkar', '21.4', 'describes', 'ordeal', 'worker', 'cocked', 'penrose', '23-year-old', 'physical', 'manhandling', 'kalashnikovs', 'throat', 'gunmen', 'swerford', 'frederic', 'malardeau', 'assailants', 'ransom', '300,000', '465,000', 'regularly', 'bombardment', 'conventional', 'tanks', 'grenade', 'launchers', 'provides', 'civilians', 'depending', 'whom', 'prize-winning', 'spokeswoman', 'albanian-born', 'fulfilled', 'dearest', 'wish', 'carved', 'role', 'herself', 'helper', 'sick', 'needy', 'marriage', 'crumbled', 'heir', '85-year-old', 'praying', 'caring', 'respirator', '339-4', 'nijmeh', 'nasr', 'arabia', 'issa', 'alloush', 'adventurers', 'wilderness', 'pemberton', 'climb', 'raft', 'bike', '323-mile', '517-km', 'endurance', 'eco-challenge', 'adventure', 'perilous', 'physically', 'diverse', 'terrain', 'stroud', 'participant', 'utah', 'maine', 'modelled', 'trek', 'glaciers', 'whitewater', 'horseback', 'ride', 'canoe', 'grueling', 'vancouver', 'treacherous', 'peaks', 'frigid', 'two-thirds', 'participants', 'disqualified', 'hardy', 'first-place', 'finishers', 'racers', 'bones', 'sunstroke', 'dehydration', 'exhaustion', '1996-05-28', 'ubimini', 'oil-rich', 'damian', 'ejiohuo', 'quell', 'safer', 'drinking', 'outbreaks', 'epidemics', 'piped', 'usually', 'malawi', 'ex-president', 'banda', 'blantyre', 'frail', 'kamuzu', 'vegetarian', 'teetotaller', 'unaided', 'walking', 'clutched', 'whisk', 'symbolised', 'obsession', 'undisputed', 'ruler', 'decades', 
'all-party', 'acquitted', '1983', 'servants', 'emelia', 'sithole', 'harare', 'zimbabwean', 'defying', 'crippled', 'essential', 'psc', 'mortuary', 'attendants', 'firefighters', 'workplaces', 'summarily', 'dismissed', 'psa', 'unavailable', 'florence', 'chitauro', 'recruiting', 'sub-contracting', 'firms', 'ignored', 'demands', 'wage', 'stretched', 'hospitals', 'tourists', '180,000', 'mugabe', 'civic', 'private-sector', 'unions', 'denounced', 'earn', 'z$', 'kigali', 'trouble-makers', 'camps', 'firmin', 'gatera', 'tutsi-dominated', 'zairean', 'goma', 'tutsi', 'kengo', 'wa', 'dondo', 'expell', 'timeframe', 'genocide', 'tutsis', 'refuse', 'fear', 'reprisal', 'kivu', 'counterpart', 'gisenyi', 'prefect', 'revered', 'skull', 'limelight-loving', 'disgrace', 'prized', 'sacred', 'tribal', 'ancestor', 'middle-aged', 'forensic', 'examined', 'supposed', 'hintsa', 'xhosa', 'tribe', 'cranium', 'nicholas', 'gcaleka', 'skins', 'regalia', 'journeyed', 'wintry', 'hugely', 'publicised', 'witchdoctor', 'ancestors', 'dream', 'colonial', 'beheaded', '1835', 'cottage', 'lonely', 'highland', 'spirit', 'hurricane', 'branding', 'charlatan', 'shape', 'hole', 'bullet', 'reasonable', 'arrests', 'sewing', 'smugglers', 'smuggle', 'machines', 'clothing', 'eritrea', 'government-owned', 'al-ingaz', 'al-watani', 'banat', 'kassala', 'alliance', 'subversive', 'laying', 'landmines', 'accuses', 'eritrean', 'accusing', 'umbrella', 'asmara', 'congress', 'jettisoning', 'stalinist', 'dictatorship', 'balkan', 'approve', 'concepts', 'turn', 'social-democratic', 'electoral', 'class', 'ideological', 'zeri', 'popullit', 'fatos', 'nano', 'sali', 'berisha', 'reformed', 'heirs', 'sham', 'acting', 'servet', 'pellumbi', 'scrap', 'ideas', 'karl', 'marx', 'pro-reform', 'stance', 'triggered', 'gramoz', 'ruci', 'commentators', 'rift', 'unlikely', 'nicaraguan', 'managua', 'nicaragua', 'violeta', 'chamorro', 'check-up', 'column', 'examination', 'suffers', 'osteoporosis', 'weakens', 'longtime', 'wo', 'tool', 'one-week', 
'nepalese', 'vigilance', 'intentions', 'restive', 'four-decade', 'widespread', 'activists', 'birenda', 'gyaicain', 'norbu', 'tourism', 'hangs', 'tehran', 'hanged', 'traffickers', 'shiraz', 'resalat', '419', 'kilograms', '924', 'lbs', 'opium', 'pedestrain', 'executions', 'revolutionary', 'pedestrian', 'site', 'executed', 'grammes', 'lb', 'punishable', 'drug-related', 'addicts', 'transit', 'smuggled', 'tunisian', 'hq', 'tunisia', 'rent', 'khalfallah', 'mds', 'bailiff', 'accompagnied', 'enable', 'represented', 'owing', 'sentences', 'moada', 'khemais', 'chammari', 'disclosing', 'secrets', 'judicial', 'proceedings', 'boulahya', 'founding', 'politically', '1978', 'mestiri', 'withdrew', 'succeeding', 'liberals', 'ben', 'jaafar', 'nicosia', 'irna', 'affiliated', 'shelled', 'kanie', 'karzhala', 'camp', 'arbil', 'puk-run', 'pounding', 'kurdish-controlled', 'iranian-backed', 'brokered', 'persuaded', 'shattering', 'patrolling', 'skies', 'shield', 'violating', '1980-88', 'majid', 'takht', 'ravanchi', 'allegations', 'boutros', 'boutros-ghali', 'constructing', 'observation', 'installing', 'mortars', 'anti-aircraft', 'cannons', 'tents', 'penetrating', 'rifle', 'grenades', 'eight-year', 'u.n.-sponsored', 'jumhouriya', 'chamber', 'urges', 'offers', 'ships', 'iraq-bound', 'aqaba', 'flare-up', 'booms', 'shadow', 'supermarkets', 'completes', 'qadissiya', 'denounces', 'warplanes', 'lambasts', 'liaising', 'babel', 'blaming', 'dirty', 'laurence', 'mcquillan', 'intends', 'gathering', 'nominate', 'parade', 'designed', 'highlight', 'dim', 'glow', 'just-concluded', 'conclave', 'dole', 'carefully', 'orchestrated', 'bills', 'republican-controlled', 'proudly', 'sixty', 'registry', 'sex', 'criminals', 'wherever', 'creation', 'underway', 'finger', 'janet', 'reno', 'footnotes', 'fbi', 'again', 'heads', 'stretch', 'drive', 'happen', 'chess', 'minimium', 'easier', 'pre-existing', 'overhauling', 'remarkable', 'offering', 'demanding', 'responsibility', 'stronger', 'sense', 'families', 'theme', 
'departs', 'kentucky', 'michigan', 'indiana', 'fellow', 'attention', 'focus', 'correspondents', 'programmes', 'showcased', 'lead-in', 'concentrating', 'mccurry', 'delivers', 'acceptance', 'map', 'guides', 'veer', 'edouard', 'swirled', 'forecasters', 'winds', 'mph', '185', 'forecaster', 'lixion', 'avila', 'indicate', 'west-northwest', '1,130', 'lesser', 'antilles', 'latitude', 'longitude', '44.2', 'eta', 'basque', 'ignacio', 'olascoaga', 'mugica', '1960s', '1997--ruehe', 'volker', 'ruehe', 'nato-led', 'ifor', 'bild', 'sonntag', 'mandate', 'expires', 'completely', 'excerpts', 'publication', 'impression', 'deployment', 'perceived', 'massacres', 'comics', 'independence-joke', 'bossi', 'orvieto', 'joke', 'umberto', 'ancient', 'etruscan', 'mock', 'cimicchi', 'actor', 'benigni', 'declare', 'etruria', 'proceed', 'annexation', 'sardinia', 'corsica', 'ironically', 'proclamation', 'padania', 'umbria', 'pop', 'balloon', 'rhetoric', 'talking', 'intensified', 'nationally', 'federalism', 'wasteful', 'centralised', 'bureaucracy', 'northerners', 'farmer', 'mutilated', 'verona', 'homocide', 'mutilating', 'bodies', 'ansa', 'gianfranco', 'stevanin', '35-year-old', 'magistrate', 'unable', 'recall', 'remembering', 'lifeless', 'sadmasochistic', 'assaulting', 'prostitute', 'murdering', 'corpses', 'headless', 'decomposed', 'sack', 'canal', 'cesare', 'dal', 'maso', 'beheading', 'dumping', 'adige', 'interrogations', 'investigators', 'suffocated', 'digging', 'passer-by', 'asks', 'paedophile', 'eluded', 'jeremy', 'lovell', 'child-sex', 'scandal', 'kidnapping', 'pornography', 'shockwave', 'revulsion', 'recriminations', 'rapist', 'dutroux', 'managed', 'prey', 'unhindered', 'starvation', 'freed', 'dungeon-like', 'compartment', 'ransart', 'mont-sur-marchienne', 'suburbs', 'abduction', 'imprisonment', 'molest', 'youngsters', 'proof', 'michel', 'bourlet', 'chase', 'porn', 'tapes', 'featured', 'dungeon', 'basement', 'euphoria', 'rescue', 'disgust', 'eight-year-old', 'lejeune', 'melissa', 'russo', 
'kidnapped', 'starved', 'marchal', 'eefje', 'lambrecks', 'unknown', 'prostitution', 'bratislava', 'accomplice', '74-year', 'dutchman', 'disappearance', 'high-level', 'accomplices', 'leaked', 'cataloguing', 'degree', 'bungling', 'incompetence', 'indifference', 'revelations', 'gendarmerie', 'surveillance', 'codenamed', 'othello', 'gendarmes', 'cells', 'theft', 'accepted', 'cries', 'hear', 'justice', 'stefaan', 'clerck', 'inquiry', 'stressing', 'indications', 'cover-up', 'disbelief', 'unemployed', 'visible', 'toll', 'seven-newspaper', 'home-made', 'bou', 'haroun', 'explosive', 'device', 'prematurely', 'el-watan', '25-year-old', 'boys', 'five-year-old', 'explosion', 'four-year-old', 'strife', 'government-appointed', 'watchdog', 'observatory', '1,400', 'seize', 'cannabis', 'chilli', 'sauce', '7.5', 'container', 'freeport', 'haul', 'flames', 'motorway', 'injuring', 'steinberg', 'spaniards', 'rebels--poll', 'madrid', 'renounced', 'permanently', 'mundo', 'supported', 'state-controlled', 'sociological', 'achieving', 'ortega', 'lara', 'worsened', 'pp', '2,496', 'margin', 'error', 'minus', 'thirty', 'floods', 'plunge', 'lahore', 'chaos', 'flood-hit', 'pakistani', '461', 'inches', 'drenched', 'punjab', 'rivers', 'knocking', 'disrupting', 'rail', 'witnesses', 'jamaat-i-islami', 'drowned', 'homeless', 'breach', 'inundating', 'residential', 'evacuate', 'low-lying', 'ravi', 'chenab', 'flood', 'internet', 'startup', 'java', '1996-08-25', 'engineers', 'microsystems', 'javasoft', 'fledgling', 'ground-floor', 'venture', 'bessemer', 'menlo', 'calif', 'founder', 'bidzos', 'rsa', 'dynamics', 'verisign', 'doors', 'initial', 'combines', 'experience', 'apple', 'oracle', 'portends', 'dramatic', 'bui', 'engineer', 'programming', 'mid-1995', 'manner', 'silicon', 'kleiner', 'perkins', 'caufield', 'byers', 'startups', 'developing', 'licensed', 'prasad', 'wagle', 'aims', 'networked', 'ubiquitious', 'applets', 'downloaded', 'server', 'individual', 'zuleeg', 'marketing', 'web', 
'www.internetstartup.com', 'pioneers', 'psi', 'birdied', 'even-par', 'mayfiar', '277', 'accomplish', 'three-stroke', 'exemption', 'pga', '378,000', '1,574,799', 'style', 'easy', 'three-putted', 'feet', 'tee', 'bogeys', '12th', 'parred', 'birdie', 'no.2', 'wedge', '17th', '6-iron', 'bogeyed', 'putt', 'runner', 'sudden', 'defending', 'contention', '14th', '7149', '274', '281', '283', '284', '285', '287', '288', '289', '290', '292', '294', '295', '298', 'luke', 'jensen', 'murphy', 'handrik', 'dreekmann', '6-0', 'jyvasklya', 'lancer', 'celica', '2:09', 'jarmo', 'kytolehto', '2:23', 'eriksson', 'impreza', '2:39', '3:03', 'motocross', '500cc', 'landskrona', 'smets', 'husaberg', 'husqvarna', 'gert', 'doorn', 'honda', 'jacky', 'martens', 'dirkx', 'ktm', 'danny', 'theybers', 'shayne', 'boonen', 'dietmar', 'lalcher', 'claus', 'manne', 'nielsen', '236', 'lacher', '219', 'darryll', '178', '125cc', 'holzgerlingen', 'tortelli', 'kawasaki', 'moore', 'yamaha', 'luigi', 'seguy', 'andi', 'kanstinger', 'charlier', 'camerlengo', 'belometti', 'vialle', 'collin', 'dugmore', '432', 'malin', '317', '293', '192', 'michele', 'fanton', '152', 'placings', 'pokka', 'suzuka', 'gt', 'ray', 'belim', 'j.j.lehto', 'fi', 'gtr', 'laps', '48.637', '158.82', 'olofsson', 'luciano', 'della', 'noce', 'ennea', 'f40', '170', 'ballace', 'grouillard', 'harrods', 'bscher', 'kox', 'f1', '168', 'fabien', 'giroix', 'jean-denis', 'deletraz', 'muller', '167', 'owen-jones', 'pierre-henri', 'raphanel', 'brabham', 'jean-marc', 'gounon', 'belmondo', 'eichmann', 'gerd', 'ralf', 'kelleners', 'gt2', 'roock', '911', '164', 'ortelli', 'wollek', 'konrad', 'cor', 'euser', 'h.', 'wada', 'furuya', 'lm600', '162', '03.684', '170.680', '156', '98', 'sarka', 'kasparkova', '14.84', 'ashia', 'hansen', '14.78', 'rodica', 'matescu', '14.18', 'deon', 'hemmings', '55.13', 'marken', '55.90', '56.00', 'javelin', 'isel', 'mcpaul', '60.66', 'silke', 'renk', '22.53', '22.58', '22.77', '12.83', '12.91', 'gillian', 'charmaine', 'crooks', 
'00.42', 'inez', '2:01.98', 'margaret', '2:02.40', 'vault', 'trond', 'bathel', '5.60', 'pat', 'manson', 'lobinger', 'pukstys', '86.82', 'backley', '82.20', 'nieland', '81.12', 'marcel', '51.50', '52.17', 'phylis', '52.53', '20.48', 'regis', '20.63', 'austin', '2.30', 'forsyth', 'patrik', 'sjoberg', '2.25', 'verbjorn', 'rodal', '1:44.93', 'benson', '1:45.96', 'vincent', 'malakwen', '1:46.18', '3:54.57', '3:54.60', 'whiteman', '3:54.87', '45.05', '45.38', '45.48', 'osmond', '10.06', 'mackie', '10.17', '10.19', '15.125', '208.442', '5.602', '15.710', '19.125', '29.179', '29.896', '1:00.754', '1:40.227', 'netherland', '1:53.067', '221.857', 'spa-francochamps', 'drivers', 'constructors', '149', 'footwork', '1:46', '1:56', '2:05', 'radstrom', 'motorcycling', 'superbike', 'sugo', 'yuuchi', 'takeda', '30.054', 'noriyuki', 'haga', '38:30.140', 'wataru', 'yoshikawa', '38:32.353', 'corser', 'ducati', '38:34.436', 'kocinski', '38:36.306', 'aaron', '38:41.756', 'norihiko', 'fujiwara', '38:43.253', 'fogarty', '38:49.595', 'akira', 'ryo', '38:50.269', 'shiya', 'takeishi', '38:52.271', '147.159', 'takuma', 'aoki', '38:18.759', '38:19.313', '38:32.040', '38:32.149', '38:32.719', '38:33.595', '38:34.682', '38:34.999', '38:35.297', '38:42.015', '147.786', '269', '254', 'pier', 'francesco', 'crafar', 'gobert', 'hodgson', 'disqualification', 'carburettor', 'keiichi', 'kitigawa', 'suzuki', '38:42.333', '270', '238', 'yuuichi', 'outclassed', 'names', 'poise', 'overtake', 'pursued', 'duo', 'chicane', 'spurt', 'flag', 'consolation', 'recording', 'limped', 'challenged', 'strongly', 'elder', 'brother', 'haruchika', 'race-long', 'duel', 'chequered', 'regained', 'unlucky', 'riders', 'alter', '611', '667', '576', '730', '473', '745', 'concludes', 'flourish', 'concluded', '154', 'interruption', 'spare', 'byas', 'reaching', '205', 'sword', 'collecting', 'hinchcliffe', 'glenn', 'hoddle', 'uncapped', 'left-back', 'anderton', 'recurring', 'groin', '74-0', '521-8', 'cruyff', 'solskjaer', 'warhurst', 
'bohinen', '51st', '54,178', 'lb-5', 'nb-16', '521', '5-365', '6-440', '7-502', '8-519', '23-3-112-0', '37.1-7-97-3', '47-10-116-2', '23-5-71-1', '29-3-116-1', '7-0-35-0', '7-1-24-0', '7-2-11-0', '2-1-4-0', '473-6', 'tea', 'run-out', 'slim', 'satisfaction', 'omission', 'reasserting', 'dominance', 'fielding', 'disciplinary', 'touring', 'batted', '413', '87', 'solitary', 'attempting', 'lurking', 'prove', 'swooped', 'alec', 'whipped', 'bails', 'waves', 'alarms', 'rattled', 'outscoring', 'forcing', 'ground-staff', '1445', '1345', 'maynard', 'ronnie', 'adam', 'hollioake', 'headley', 'togo', 'congo', 'lome', 'salou', 'bachirou', '53rd', 'crvena', 'zvezda', 'zelesnik', 'bogdan', 'prusek', 'slawomir', 'wojciechowski', 'jacek', 'dembinski', 'widzew', 'marcin', 'mieciel', 'wieczorek', 'berensztain', 'marek', 'citko', 'fedoruk', 'dariusz', 'jackiewicz', 'bartlomiej', 'jamroz', 'tomasz', 'moskal', 'krzysztof', 'piskula', 'mariusz', 'srutwa', 'emmanuel', 'tetteh', 'warszawa', 'zagorski', 'bucharest', 'a.s.', 'bacau', 'ceahlaul', 'piatra', 'neamt', 'otelul', 'galati', 'arges', 'dacia', 'pitesti', 'farul', 'constanta', 'chindia', 'tirgoviste', 'sportul', 'studentesc', 'universitatea', 'craiova', 'petrolul', 'ploiesti', 'politehnica', 'timisoara', 'brasov', 'jiul', 'petrosani', 'dinamo', 'cluj', 'steaua', 'alaniya', 'zhemchuzhina', 'sochi', 'baltika', 'kaliningrad', 'zenit', 'petersburg', 'chernomorets', 'novorossiisk', 'rostselmash', 'rostov', 'lokomotiv', 'torpedo', 'rotor', 'volgograd', 'cska', 'kamaz', 'naberezhnye', 'chelny', 'lada', 'togliatti', 'tekstilshik', 'kamyshin', 'krylya', 'sovetov', 'samara', 'nizhny', 'novgorod', 'uralmash', 'yekaterinburg', 'precedence', '49', 'tekstilshchik', 'rules-afl', 'rules', 'adelaide', '14.12', 'collingwood', '153', '151', '11.12', '28.19', 'fitzroy', 'carlton', '13.18', 'footscray', '9.12', 'essendon', '14.16', '12.10', 'kilda', 'hawthorn', 'brisbane', '10.11', 'fremantle', 'geelong', '16.13', '2123', '1631', '130.2', '2067', '1687', 
'122.5', '2151', '1673', '128.6', '2385', '1873', '127.3', '2009', '1844', '108.9', '2288', '117.9', '2130', '109.4', '2173', '1803', '120.5', '1791', '1820', '98.4', '1909', '1958', '97.5', '2103', '2091', '100.6', '2158', '2183', '98.9', '1642', '2361', '69.5', '1912', '87.5', '1578', '2060', '76.6', '1381', '2778', '49.7', 'bulldogs', 'queensland', 'illawarra', 'penrith', 'manly', 'parramatta', 'auckland', 'premiership', '501', '569', '257', '560', '487', 'cronulla', '359', '258', '502', '374', '421', '344', '366', '426', '406', '309', '435', '388', '391', '356', '395', '297', '448', '593', '351', '483', '304', '586', '460', '1-15', '15-1', 'marlene', 'thomsen', 'lisbet', 'stuer-lauridsen', 'qiang', 'lu', '10-15', '17-16', 'yap', 'cheah', 'kit', 'wan', 'chong', 'tan', 'fook', '0*', '*note', '.610', '.547', '.537', '.534', '.467', '.439', '.357', '.589', '.569', '.470', '25th', '.633', '.462', '.454', '.408', '.426', '.542', '.515', 'sneak', 'rafael', 'palmeiro', 'two-out', 'alomar', 'berth', 'trailed', 'kyle', 'abbott', 'sacrificed', 'mariner', 'bragg', '9-5', 'contact', 'seitzer', 'hulse', 'extra-inning', 'wickman', 'acquired', 'marty', 'cordova', 'lawton', '6-5', 'yeah', 'ballpark', 'wally', 'whitehurst', \"o'neill\", 'sixth-inning', 'triple-a', 'columbus', 'defeating', 'cardinals', 'padres', 'rosado', 'tucker', 'six-game', '9-2', 'cellar-dwellers', '5-3', '8-2/3', '21-year-old', 'left-hander', '29-2/3', 'braves', 'cubs', 'mcgriff', '5-for-5', 'clontz', 'eight-hitter', 'ellis', 'burks', 'rockies', 'pirates', '9-3', 'vinny', 'castilla', 'dante', 'bichette', '44-20', 'kurt', 'marlins', 'tired', 'candiotti', 'piazza', 'hollandsworth', 'dodgers', '8-9', 'season-high', 'joey', 'rickey', 'league-record', 'leadoff', 'phillies', '12-7', 'segui', 'expos', 'shut', 'giants', 'lasted', '1-1/3', 'eight-plus', 'orlando', 'stottlemyre', 'astros', 'virtual', 'nl', 'shane', 'reynolds', '16-6', 'five-hitter', 'kicked', 'setubal', 'squeeze', 'equaliser', 'jardel', 'string', 
'opportunities', 'redeemed', 'netting', 'skilful', 'counter-attack', 'unmarked', 'chiquinho', 'conde', 'keeper', 'andrejez', 'wozniak', 'braga', 'rodrigo', 'carneiro', 'bookable', 'lack', 'first-class', 'apparent', 'valdo', 'knee', 'paulao', '81st', 'baltasar', 'tripped', 'referee', 'nose', 'idalecio', 'whistle', 'guimaraes', 'gil', 'vicente', 'fiorentina', 'batistuta', 'perfect', 'birthday', 'supercup', 'serie', '1926', 'marked', 'schwarz', 'lob', 'franco', 'baresi', 'montenegrin', 'savicevic', 'weaving', 'checking', 'left-footed', 'toldo', 'desailly', 'fouled', 'boca', 'juniors', 'oscar', 'tabarez', 'rammed', '83rd', 'curling', 'dipping', 'batigol', 'adoring', 'reward', 'weah', 'baggio', 'davids', 'substitute', 'supercoppa', '29,582', 'norwegian', 'tromso', 'kongsvinger', 'valerenga', 'skeid', 'stabaek', 'stromsgodset', 'molde', 'bodo', 'glimt', 'viking', 'rosenborg', 'lillestrom', 'duisberg', 'zieger', 'witechek', 'aarau', 'grasshopper', 'lucerne', 'lugano', 'basle', 'neuchatel', 'gallen', '480,618', 'montgomerie', '429,449', '301,972', '291,088', 'mcnulty', '254,247', '253,337', '246,077', '233,713', '229,360', '211,175', 'nobilo', '209,412', '208,978', '207,990', '202,593', '188,143', '181,005', '172,580', '170,952', 'payne', '165,150', '156,996', 'cycling', '232-km', 'ferrigato', 'bartoli', 'museeuw', 'lance', 'armstrong', 'casagrande', 'alessandro', 'baronti', 'vandenbroucke', 'fabio', 'baldato', 'maurizio', 'fondriest', 'jalabert', 'zanini', 'gontchenkov', 'gabriele', 'tchmil', 'sciandri', 'sprints', 'sprinted', 'weekends', 'similarly', 'narrow', '237km', 'pack', 'oerlikon', 'velodrome', 'faded', 'briton', 'torrential', '193', '199', '201', 'heinz-peter', 'thul', '203', 'emerson', 'baker', 'gorre', 'ernest', 'faber', 'ronald', 'waterreus', 'amends', 'corner', 'romano', 'dimissal', 'zeljko', 'petrovic', 'dismissal', 'atteveld', 'erwin', 'looi', 'gaston', 'taument', 'newly', 'pablo', 'genk', 'harelbeke', 'mechelen', 'wanrooy', '7,032', 'hoogma', 'roelofsen', 
'7th', '27,500', '20th', 'godee', 'arum', '73th', 'hamming', '7,250', 'arnold', 'haldtime', '11,500', '74th', '0.', '13,500', 'blind', 'endt', 'anp', 'selection', 'devote', 'sidhu', 'opener', 'navjot', 'singh', '50-day', 'quitting', 'right-handed', 'forfeit', 'mohali', 'chandigarh', 'azharuddin', 'sachin', 'four-nation', 'singer', 'sahara', '1996-08-26', 'relive', 'sean', 'fitzpatrick', 'revisited', 'magic', 'moments', 'momentous', 'nzpa', 'first-ever', '50,000-seat', 'loftus', 'versfeld', 'magnificent', 'relived', 'moves', 'tackles', 'emotions', 'three-pointer', 'maul', 'halfback', 'marshall', 'openside', 'emptied', 'punching', 'bucks', 'spontaneous', 'bunce', 'exhausted', 'gutted', 'nowhere', 'choice', 'riding', 'amazing', 'two-try', 'winger', 'buggered', '4000', 'zealander', 'supporters', 'partying', 'goodwill', 'hart', 'rang', 'congratulations', 'thanked', 'understand', 'tremendous', 'afl', 'league-australian', 'apartheid', 'enforcers', 'subpoenas', 'dig', 'beneath', 'rationales', 'sinister', 'whites', 'archbishop', 'desmond', 'tutu', 'paint', 'f.w.', 'klerk', 'thabo', 'mbeki', 'apologies', 'currin', 'hearings', 'confessional', 'personally', 'crimes', 'testify', 'separate', 'amnesty', 'souls', 'tell', 'confess', 'abuses', 'testimony', 'deeds', 'self-confessed', 'hit-squad', 'dirk', 'coetzee', 'boraine', 'voluntarily', 'hardline', 'p.w.', 'botha', 'advising', 'regarded', 'achieve', 'totality', 'cited', 'confessing', 'interviews', 'tricks', 'prosecutions', 'submissions', 'anc', 'constand', 'viljoen', 'unsatisfied', 'apartheid-era', 'submission', 'caller', 'utterly', 'useless', 'jannie', 'gagiano', 'doubted', 'implemented', '1948', 'dismantling', 'burden', 'guilt', 'exculpated', 'therefore', 'doubts', 'reconciling', 'yourself', 'historical', 'adversary', 'lodge', 'witwatersrand', 'demurred', 'irritation', 'jokes', 'anger', 'express', 'moral', 'uneasiness', 'percolating', 'downwards', 'serb-held', 'samir', 'arnaut', 'matuzici', 'farce', 'incomers', 'cementing', 
'partition', 'post-war', 'doboj', 'banners', 'moslem-led', 'moslems', 'angered', 'provision', 'western-organised', 'billed', 'reintegrate', 'multi-ethnic', 'shaping', 'facto', 'jure', 'dayton', 'truly', 'edhem', 'efendija', 'camdzic', 'imam-in-exile', 'upon', 'reuf', 'mehemdagic', 'municipality-in-exile', 'eleven', 'thousand', 'reintegration', 'refugee', 'thrown', 'warning', 'ejup', 'ganic', 'fortune', 'loud', 'applause', 'untie', 'knot', 'ensured', 'croat', 'mobs', 'impassable', '1992-95', 'serb-controlled', 'beefed', 'emotional', 'inter-entity', 'boundary', 'dispersed', 'scuffled', 'blaze', 'deliberately', 'casinos', 'communism', 'wide-ranging', 'engaged', 'pullout', 'shatoi', 'anatoly', 'shkirko', 'disarmed', 'cameraman', 'liutauras', 'stremaitis', 'carriers', 'lorries', 'suspending', 'movladi', 'udugov', 'maverick', 'element', 'leftist', 'mexican', 'epr', 'operated', 'assertions', 'commanders', 'jornada', 'overthrowing', 'guerrero', 'irrational', 'radicals', 'erp', 'fatigues', 'brandishing', 'southwestern', '23,000-strong', '37-page', 'manual', 'detailing', 'tactics', 'strategies', 'basic', 'apparatus', 'bourgeoisie', 'granted', 'volatile', 'protesters', 'violently', 'unrelated', 'zapatista', 'chiapas', 'combat', 'skirmishes', 'gunned', 'northwest', 'unidentified', 'dragged', 'ot', 'antioquia', 'killings', 'municipality', 'anza', 'medellin', 'linking', 'farc', 'impunity', 'unconfirmed', 'bloodshed', 'paramilitary', 'tauranaga', 'climbs', '9.050', '6.03', 'burma', 'mae', 'sot', 'burmese', 'splinter', 'ambushed', 'patrol', 'buddhist', 'dkba', 'col', 'suvit', 'maenmuan', 'allied', 'rangoon', 'infiltration', 'intrusions', 'reinforcements', 'porous', 'frontier', 'anti-rangoon', 'knu', 'intermittent', 'inhabitants', 'villages', 'contol', 'reject', 'explanation', 'supplies', 'directs', 'f-14', 'catches', 'tyre', 'gurion', 'wheel', 'yehiel', 'amitai', 'pilots', 'brigade', 'jars', 'reveal', 'mummies', 'archaeologists', 'pots', 'egyptians', 'burial', 'rites', 
'mummification', 'saleh', 'museum', 'contain', 'intestines', 'tomb', 'dahshour', 'pyramid', 'pharaoh', 'seneferu', 'metropolitan', 'canopic', 'unguent', 'unidentifed', 'dynasty', '1991-1786', 'bc', 'finding', 'contains', 'substances', 'conservation', 'cavity', 'analysis', 'liquids', 'executes', 'robbers', 'shabir', 'ahmad', 'jalil', 'mecca', 'beheads', 'rapists', 'murderers', 'tamper', 'stability', 'tolerated', 'marwan', 'muasher', 'disturbances', 'bahrain', 'al', 'rai', 'abdul-karim', 'al-kabariti', 'commited', 'ceiling', 'sultan', 'telephones', 'releases', 'expresses', 'traditions', 'ad', 'dustour', 'kabariti', 'reactivate', 'legislative', 'aswaq', 'weizman', 'consult', 'ezer', 'weighing', 'consulted', 'yedioth', 'ahronoth', 'aryeh', 'shumer', 'fitting', 'proces', 'cool', 'bombers', 'haaretz', 'donated', 'opposes', 'maariv', 'education', 'columns', 'erekat', 'avraham', 'tamir', 'establish', 'puts', 'kahalani', 'warns', 'voting', 'lebanese', '580,000', 'voters', 'eligible', 'choose', '128-member', 'thin', 'trickle', 'casting', 'ballots', 'polling', 'stations', 'invites', 'caesarea', 'ceremonial', 'architect', 'spoken', 'frequently', 'urging', 'employee', 'skilled', 'nicely', 'contribute', 'consulting', 'towers', 'perrin', 'performs', 'accountant', 'salary', 'sandra', \"o'neal\", 'principal', 'evaluated', 'solely', 'skill', 'abilities', 'skills', 'creative', 'sensitive', 'customer', 'needs', 'productivity', '750', 'mid-to-large', 'corporations', 'surveyed', 'restructuring', 'agenda', 'structure', 'skills-based', 'non-management', 'fad', 'inexorable', 'hierarchical', 'concept', 'defined', 'multi-layers', 'competitive', 'emphasis', 'raise', 'eliminate', 'increases', 'bonuses', 'incentives', 'culture', 'rated', 'high-performing', 'decisions', 'high-performance', 'engaging', 'geert', 'clercq', 'neufchateau', 'inquiries', 'georges', 'zicot', 'insurance', 'fraud', 'forgery', 'searches', 'sites', 'thefts', 'gerard', 'pignon', 'warehouse', 'stolen', 'insurer', 'thierry', 
'dehaan', 'ring', 'weinstein', 'shockwaves', 'eight-year-olds', 'detroux', 'abducted', 'disagreement', 'thily', 'bregancon', 'funding', 'pubished', 'texts', 'practically', 'chirac', 'riviera', 'fortress', 'widely', '+331', 'muzaffarabad', 'pakistan-ruled', 'azad', 'indian-ruled', 'waged', 'instantly', 'kunar', 'garhi', 'habibullah', 'reopening', 'salang', 'embattled', 'kabul-salang', 'supreme', 'coordination', 'jumbish-i-milli', 'powerful', 'warlord', 'rashid', 'dostum', 'postponement', 'precautions', 'hezb-i-islami', 'gulbuddin', 'hekmatyar', 'rejoined', 'persuade', 'jumbish', 'burn', 'hasina', 'effigy', 'anis', 'battled', 'sheikh', 'bogra', 'barricaded', 'ruling', 'awami', 'battles', 'alight', 'janakantha', 'alleging', 'pro-government', 'batons', 'teargas', 'stones', 'bombs', 'bnp', 'denounce', 'coincided', 'policeman', 'gunshots', 'pro-opposition', 'section', 'grants', 'urged', 'legislators', 'denouncing', 'barbarity', 'rafiqul', 'islam', 'raided', 'arresting', 'outsiders', 'student', 'dormitories', 'seizing', 'stormed', 'halls', 'flushed', 'gunpoint', 'baggage', 'revolvers', 'sawn-off', 'shotguns', 'knives', 'swoop', 'vice-chancellor', 'emajuddin', 'deteriorating', '28,000-student', 'wednedsay', 'gunbattles', 'begum', 'khaleda', 'zia', 'blanket', 'possessors', 'irrespective', 'identities', 'crashes', 'ravine', 'fertile', 'drought', 'irene', 'marushko', 'batkivshchyna', 'collective', 'shiny', 'green-and-yellow', 'deere', 'parked', '1,750-hectare', '4,325-acre', 'grain-growing', 'regions', 'fill', 'agronomist', 'enthusiasm', 'diesel', 'odnosum', 'breakdown', 'machinery', 'loaned', 'ukrainian', 'grain', 'harvest', 'harsh', 'scoured', 'steppes', 'stunting', 'sector', 'transition', 'rich', 'boots', 'reputation', 'breadbasket', 'brutal', 'collectivisation', 'dictator', 'josef', 'stalin', 'quality', 'hryhory', 'borsuk', 'mironivka', 'institute', 'agrarian', 'temperature', 'celsius', '143.60', 'fahrenheit', 'unlit', 'electricity', 'unpaid', 'dry', 'rainfall', 
'harvesting', 'strains', 'resistant', 'extreme', 'climate', 'agricultural', 'farms', 'nascent', 'fertiliser', 'herbicides', 'pesticides', 'repair', '36.5', 'worse', 'priced', 'cheaply', 'pigs', 'solutions', 'horizon', '260', 'readying', 'sowing', '5.2', 'hectare', '2.5', 'acres', '3.9', '2.11', 'borrowing', 'two-lane', 'passes', 'occasional', 'horse-drawn', 'buggy', '1,700-hectare', '4,200-acre', 'shevchenko', 'neat', 'tidy', 'decay', 'sypron', 'strapped', 'bartering', '220', 'rickety', 'tractors', 'badly', '160-200', 'soprun', 'dedication', 'harvested', 'autumn', 'item', 'grows', 'resources', 'borkus', 'subsidies', 'pre-soviet', 'hectares', '124', '36,000', 'willing', 'hurry', 'privatising', 'negative', 'swells', 'setbacks', 'melanie', 'cheary', 'swelled', 'attributable', 'streamlined', 'divisional', 'gilbertson', 'happily', 'illusion', 'arising', 'weakness', 'rand', 'relative', '1,803', '1,003', '469', '279', 'impala', 'platinum', 'substantial', 'obvious', 'furnace', 'implats', '4.5350', 'ingwe', 'coal', 'rains', 'forfeited', 'flooding', 'mpumulanga', 'gloom', 'blocking', 'merger', 'lonrho', 'plc', 'disappointment', 'challenges', 'soundly', 'structured', 'prudently', 'financed', 'blessed', 'portfolio', 'world-class', 'businesses', 'disposal', 'malbak', 'disposals', 'pruned', 'concentrate', 'core', 'disposing', 'non-core', 'pruning', 'commodity', 'invested', 'referring', '41.5', 'cheaper', 'snapping', 'liked', 'downturn', 'offshore', '482-1003', 'ivac', 'eli', 'lilly', 'intravenous', 'infusion', 'therapy', 'wholly', 'imed', 'merge', 'pumps', 'fluid', 'patient', 'proprietary', 'disposable', 'combined', 'diego-based', 'provider', 'health-care', 'plants', 'creedmoor', 'n.c.', 'tijuana', 'distributes', 'prodcuts', '120', 'dec.', 'dlj', 'expects', 'unspecified', 'one-time', 'technology-based', 'delivery', 'iv', 'pump', 'regulated', 'volumetric', 'fully', '53.9', 'excluding', '17.4', '112.8', '8.4', '29.2', 'mercer', 'ceo', 'mallinckrodt', 'kuhn', 'regulatory', 
'approval', 'morris', 'boosted', '92', 'mirroring', '5,731', 'nasdaq', 'fractionally', '1,143', '666', 'lagged', 'declines', '476/698', '837/763', '30-year', 'treasury', '2/32', '6.96', 'thrashed', '66-14', 'inaugural', 'secured', 'knowsley', '1975', 'rain-soaked', 'hunte', 'grabbed', 'hat-trick', 'martyn', 'sullivan', 'newlove', 'goalkicker', 'bobbie', 'goulding', 'seven-year', 'reign', 'toast', 'broncos', 'scrape', 'end-of-season', 'play-offs', 'sights', 'treble', '2:37', '2:42', '3:22', '4.09', 'sebastian', 'lindholm', '5:17', 'lasse', 'lampi', '12:01', 'madeira', '16:34', 'angelo', 'medeghini', '18:28', 'finn', '1,452-km', 'doubling', 'decisive', 'gearbox', 'maakinen', 'strengthened', 'retirement', 'nearest', 'sharpe', 'superb', 'hapless', 'anchored', 'repaid', 'slice', '4.5', '6.98', 'fee', 'top-draw', 'rush', 'feeding', 'galloped', 'unfavoured', 'arc', 'right-hand', 'under-fire', 'wilkinson', 'booed', 'jeers', 'cheers', '25,860', 'joins', 'three-wicket', '300th', 'becomes', '300-club', 'bowlers', 'imran', 'feat', 'cricketers', 'kapil', 'dev', '434', 'hadlee', '431', 'botham', '383', 'malcolm', 'indies', '376', '362', 'lillee', '355', 'willis', 'gibbs', 'trueman', '307', 'courtney', 'walsh', '208', 'middlesex', '144', '137', '5-43', '323-5', 'llong', '273-5', '118', 'cottey', '142-4', '53-0', '3-12', '164-4', 'weston', '231-7', '4-48', '135-9', '242', '48-1', 'b-6', 'lb-2', 'nb-13', '1-96', '2-136', '3-166', '4-179', '5-187', '6-205', '7-220', '8-238', '9-242', '15.4-1-67-3', '18-3-55-1', '37-10-78-6', '10-3-30-0', 'nb-5', '1-7', '3-0-15-0', '3-0-24-1', '0.4-0-9-0', 'lord', 'requiring', '950', '455', '30-sept', 'falkir', 'montrose', 'rica', 'ronaldo', 'gonzalez', 'salas', 'seychelles', 'gleeson', 'bowed', 'islanders', 'mauritius', 'qualifiers', 'fifa', 'breakthrough', 'mauritian', 'caboche', 'crude', 'tackle', 'responded', 'setback', 'ashley', 'mocude', '50th-minute', 'seychellois', 'favourites', 'botswana', 'windhoek', 'cameroon', 'gabon', 'german-based', 
'tanzania', 'shoot-out', 'overcome', 'legs', 'decider', 'elimination', 'humiliating', 'preliminaries', 'mauritania', 'benin', 'nouakchott', 'postponed', 'collated', 'aggregaete', 'kremin', 'kremenchuk', 'vorskla', 'poltava', 'ternopil', 'zaporizhya', 'shakhtar', 'donetsk', 'kryvbas', 'kryvy', 'rig', 'karpaty', 'lviv', 'prykarpattya', 'ivano-frankivsk', 'zirka-nibas', 'kirovohrad', 'chornomorets', 'odessa', 'metalurg', 'dnipro', 'dnipropetrovsk', 'tavria', 'swimming', 'popov', '`serious', 'stabbing', 'freestyle', 'titles', 'rimma', 'maslova', 'expert', 'olympics', 'abdomen', 'roadside', 'watermelon', 'sellers', 'south-west', 'wound', 'kidney', 'ntv', 'worry', 'cheerfully', 'attackers', 'vitaly', 'smirnov', 'swimmer', 'chosen', 'slovak', 'slovan', 'tatran', 'presov', 'artmedia', 'petrzalka', 'jas', 'bardejov', 'dac', 'dunajska', 'streda', 'trnava', 'dukla', 'banska', 'bystrica', 'nitra', 'msk', 'zilina', 'kosice', 'petrimex', 'prievidza', 'rimavska', 'sobota', 'lokomotiva', 'kerametal', 'dubnica', 'hungarian', 'haladas', 'mtk', 'bekescsaba', 'bvsc', 'csepel', 'videoton(*', 'zte', 'debrecen', 'siofok', 'ujpest', 'vac', 'vasas', 'pecs', 'te', 'ftc', 'videoton', 'gyor', 'iii.ker.tve', '*name', 'parmalat', 'fehervar', '+361', 'petra', 'drnovice', 'liberec', 'sk', 'slavia', 'praha', 'ceske', 'budejovice', 'fk', 'jablonec', 'viktoria', 'zizkov', 'banik', 'ostrava', 'teplice', 'boby', 'brno', 'sigma', 'olomouc', 'bohemians', 'karvina', 'hradec', 'kralove', 'kaucuk', 'opava', 'plzen', 'ac', 'atlante', 'atlas', 'azul', 'leon', 'guadalajara', 'monterrey', 'veracruz', 'pachuca', 'toluca', 'puebla', 'unam', 'morelia', 'uag', 'neza', 'necaxa', 'celaya', 'catch', 'homewood', 'sao', 'narciso', 'chartered', 'cbf', 'paulo-santos', 'usual', 'package', 'internacional', 'hectic', 'arrive', 'curitiba', 'botafogo', 'tulio', 'zagalo', 'features', 'top-scorer', 'struggling', 'apertura', 'estudiantes', 'ferro', 'carril', 'oeste', 'independiente', 'gimnasia-jujuy', 'platense', 'huracan', 
'lanus', 'huracan-corrientes', 'newell', 'velez', 'sarsfield', 'rosario', 'gimnasia-la', 'plata', 'lorenzo', 'banfield', 'deportivo', 'espanol', 'colon', 'honduras', 'tegucigalpa', 'castro', '3rd', 'enrique', 'centeno', 'pavon', 'cricuma', 'fluminense', 'criciuma', '89-86', '45-46', '.604', '.551', '.463', '.456', 'moroccan', 'rabat', 'widad', 'fes', 'oujda', 'raja', 'casablanca', 'tetouan', 'jeunesse', 'massira', 'meknes', 'settat', 'marrakesh', 'khouribga', 'mohammedia', 'sidi', 'kacem', 'jadida', 'hassania', 'agadir', 'quench', 'thirst', 'afford', 'reads', 'please', 'shade', 'drink', 'plenty', 'fluids', 'advisory', 'concluding', '...and', 'garishly-coloured', 'sun-drenched', 'litre', 'life-sustaining', '4.00', 'incredulous', 'noting', 'notorious', 'gouging', 'insult', 'offended', 'baked', 'lasagna', '8.50', 'yorker', 'rebecca', 'sandwich', 'hungry', 'forked', 'pronounced', 'carol', 'perry', 'chimed', 'ridiculous', 'wine', 'indeed', 'chardonnay', 'zinfandel', '4.75', '4.50', 'alcoholics', '12.50', 'hamburger', 'fries', 'snack', 'thirsty', '16.50', 'cheese', 'whopping', '8.00', 'tuscan', 'tuscany', 'maleeva', 'up-and-comers', 'larry', 'youthful', 'finalist', 'magdalena', 'sunny', '15-year-old', 'honoured', 'straight-sets', '112th-ranked', 'montolio', 'cheery', 'worries', 'overmatched', 'engagement', 'cement', 'flushing', 'meadows', 'bowing', 'floater', 'momentum', 'rhythm', 'tough', 'errors', 'manhattan', 'mourn', 'non-', 'rookie', 'aleksandra', 'olsza', '110th', '18-year-old', 'celebrated', 'removing', 'curtain-raising', 'ringing', 'endorsement', 'newest', 'proven', 'mettle', 'quarters', 'conditioning', 'kilos', 'fast-moving', 'scared', 'undaunted', 'pros', 'big-serving', 'brenda', 'schultz-mccarthy', 'nana', 'miyaga', 'helena', 'sukova', 'prevailed', 'barbara', 'paulus', 'yi', 'jing-qian', 'glad', 'fiasco', 'sweating', 'four-set', 'haas', 'embarrassing', 'cried', 'remaking', 'kids', 'enjoy', 'tradition', 'strict', 'accordance', 'favourtism', 'yvegeny', 'spots', 
'ranking', 'approximately', 'outrage', 'tarnished', 'damaging', 'ought', 'usta', '27-year-old', 'focused', 'energies', 'sun-baked', 'grandstand', '11th-seeded', 'lingers', 'homegrown', 'controversy', 'engulfed', 'original', 'bumped', 'unfairness', 'exits', 'benefitted', 'fiddling', '18th', 'deserves', 'anne-gaelle', 'sidot', 'janette', 'husarova', 'miyagi', 'vitoux', 'delgado', 'paraguay', 'henrietta', 'nagyova', 'gala', 'pizzichini', 'schett', 'sabine', 'appelmans', 'cristina', 'torrens-valero', 'spirlea', 'begerow', 'gaidano', 'schnell', '9-7', 'heat', 'dier', 'tramacchi', 'anna', 'kournikova', 'richterova', 'debbie', 'stephanie', 'deville', 'rittner', 'kristina', 'brandi', 'ines', 'gorrochategui', 'grzybowska', 'jaime', 'oncins', 'corina', 'morariu', 'linda', 'wild', 'sung-hee', 'pitkowski', 'meghann', 'shaughnessy', '6-', 'dally', 'randriantefy', 'madagascar', 'elena', 'makarova', 'courtois', 'flora', 'perfetti', 'leander', 'paes', 'neville', 'godwin', 'alexandra', 'fusai', 'jill', 'craybas', 'jecmenica', 'dechy', 'christina', 'jane', 'chi', 'callens', 'nicole', 'bradtke', 'baudone', 'jolene', 'watanabe', 'kandarr', 'tyler', 'sweep', '3-2', 'foster', 'fastball', 'rotate', 'changeup', '3-for-4', 'outslugged', '13-9', 'wilkins', 'ericks', '13-8', 'renteria', 'fielded', 'cleanly', 'boles', 'osvaldo', 'fenandez', 'seven-hitter', 'trenidad', 'hubbard', '6-13', 'gagne', 'run-scoring', 'chad', 'pinch-hits', 'pennants', 'jody', 'reed', 'caminiti', 'bagwell', 'donne', '8-4', '1-1/2', 'shoulder', '.466', '.362', '.592', '.530', '.447', '.573', '.474', '.628', '.405', '.523', '.423', '.545', '.519', 'all-star', 'appearing', 'battling', 'hamstring', '357', 'second-longest', '2,282nd', '13-0', 'pinch-hitting', 'mri', 'mild', 'strain', 'lineup', '1-for-2', 'exiting', '32-year-old', '.307', 'last-place', 'outfielder', 'sammy', 'sosa', 'third-longest', 'baseman', 'jonk', 'guus', 'hiddink', 'wim', '14-month', 'gastel', 'boer', 'bergkamp', 'goey', 'jaap', 'stam', 'reiziger', 
'kock', '04', 'witschge', 'aron', 'internazionale', 'seedorf', '31st', 'pizzi', 'pena', '75th', 'esnaider', 'pantic', '263-7', '138', 'scoreboard-australia', 'slater', 'strang', 'whittall', 'bevan', 'brandes', 'hogg', 'b-1', 'lb-8', 'w-3', 'nb-3', '263', '1-48', '2-92', '3-167', '4-230', '5-240', '6-242', '7-263', 'reiffel', 'flemming', '10-1-50-1', '2w', '2nb', '10-1-47-2', '1w', '9-0-41-1', 'flower', '6-0-28-0', '10-0-53-3', '1nb', 'decker', '3-0-17-0', 'shah', '2-0-18-0', 'wishart', 'evans', 'dekker', 'lb-4', 'w-10', 'nb-7', '1-16', '2-16', '3-33', '4-35', '5-56', '6-98', '7-100', '8-120', '9-120', '7-2-13-1', '7-0-24-2', '3w', '3nb', '6-1-23-2', '7-2-24-1', '9-2-26-1', '5-1-24-3', 'day-night', 'toss', 'opt', 'stuart', 'damein', 'fleming', 'eddo', 'heath', 'maputo', 'story', 'mozambican', 'noticias', 'nhamavila', 'lamonts', 'apparel', 'files', 'reorganization', '18:00', 'kirkland', 'wash', 'filed', 'unsecured', 'bondholders', '4.05', '5.67', 'creditors', '3.13', 'non-trade', 'existing', 'capitalization', 'reaches', 'entitling', 'dilution', 'blazing', 'ferry', 'safely', 'guernsey', 'trident', 'emeraud', 'boats', '88-year-old', 'jersey', 'cluster', 'british-ruled', 'north-west', 'schork', 'nationwide', 'balloting', 'irregularities', 'assemblies', 'provisional', 'consider', 'agota', 'kuperman', 'select', 'cancell', 'specify', 'organise', 'rule-making', '600,000', 'electorate', 'pec', 'citizens', 'slated', 'cantonal', 'moslem-croat', 'parliaments', 'representatives', 'three-man', 'dnevi', 'sda', 'municipal-level', 'frowick', 'allege', 'systematically', 'discouraged', 'registering', 'cast', 'ballot', 'majorities', '43-month', 'underpopulated', 'cleansing', 'consolidating', 'voter', 'herald', 'multi-ethnicity', 'bosia-hercegovina', 'soren', 'jessen-petersen', 'run-up', 'nationalistic', 'sectarian', 'card', 'drumming', 'constituencies', 'memories', 'tougher', 'alastair', 'macdonald', 'abandon', 'sobering', 'appointed', 'heady', 'wrap', 'compromise', 'settlement', 
'insistence', 'chain-smoking', 'paratroop', 'deadpan', 'putdowns', 'knack', 'arrange', 'ambitious', 'pledging', 'conclude', 'pro-war', 'schemers', 'empty-handed', 'viktor', 'chernomyrdin', 'undisclosed', 'meanwhile', 'departments', 'limb', 'hardly', 'reelection', 'criticising', 'pains', 'insist', 'suddenly', 'profited', 'inadequacy', 'risked', 'face-saving', 'acceptable', 'letting', 'quit', 'encourage', 'tendencies', 'caucasus', 'yastrzhembsky', 'yastrezhembsky', 'offical', 'recover', 'receives', 'packet', 'yugo', 'zastava', 'factory', 'wages', 'revive', 'stubborn', 'strength', 'persist', 'dragutin', 'stanojlovic', 'revival', 'consumed', 'pre-war', 'montenegro', 'kragujevac', 'bitterness', 'stirring', 'branch', 'exaggerated', 'passers', 'gordana', 'kukic', '+381', '222', '4254', '9.1', 'lenders', 'trim', '10.0', 'insurers', 'five-10', 'settlements', 'shrank', 'meagre', '5.5', 'calculated', 'midrates', '5.2420', '3.5486', 'kolumbina', 'bencevic', '385-1-4557075', 'svcd', 'controllers', 'bulatka', 'raichev', '1,380', 'technicians', 'paralyse', 'valkov', 'charter', 'carries', 'resorts', 'minimal', 'servicing', 'lock-out', '230', 'separation', 'liliana', 'semerdjieva', 'naina', 'satisfactory', 'tass', 'clinical', 'treats', 'mrs', 'mironov', 'daughters', 'run-off', 'eye', 'mostostal', 'z', '25-', 'million-zloty', 'convertible', 'piotr', 'grabowski', '10-session', 'grabowksi', 'paying', 'benchmark', '52-week', 'pbr', '1.6', 'exchanged', '2.6', 'book-building', 'proceeds', 'modernise', '+48', '653', '9700', 'kidnaps', 'kidnappers', 'humberto', 'hueite', 'zyrecha', 'jetty', 'kors', 'misael', 'valerio', 'fleeing', 'altamira', 'wisinga', 'aguas', 'zarcas', 'rica-nicaragua', 'santa', 'pocosol', 'supposedly', 'tourist', 'regula', 'susana', 'siegfried', 'nicola', 'fleuchaus', 'bizarre', 'twist', 'julio', 'cesar', 'rojas', 'sentimental', 'attachment', 'photographs', 'rican', 'interacciones', 'ups', 'lowers', 'peso', 'brokerage', '4.3', 'projection', 'economist', 'alonso', 
'cervera', 'revisions', 'chiefly', 'fueled', '6.1', 'q4', 'year-end', '7.85-8.15', '8.20-8.50', '9.20-9.40', '25.8', 'loosened', 'boosting', 'commitments', 'schemes', 'debtors', '+525', '728-9560', 'bancomext', 'appreciation', 'drop-off', 'moreno', 'turrent', 'promotion', 'importers', 'dlrs', '1,044', 'dollar-buying', '1,041', 'wire', 'transfers', 'accumulated', 'contributing', 'greenbacks', 'shy', 'typical', 'month-end', 'position-squaring', 'helps', 'limit', '142', 'intra-day', '1,037', 'guillermo', 'londono', '571', '610', '7944', 'hashimoto', 'ryutaro', '10-day', 'latin', 'underwent', 'correct', 'compression', 'johns', 'hopkins', 'inflamation', 'drown', 'venezuelan', 'boating', 'maracaibo', 'sank', 'lake', 'zarraga', 'nighttime', 'spin', 'sinking', 'stern', 'lifejackets', 'banco', 'inject', '3.412', 'pesos', 'auctions', '1.206', '1.000', '525', '728-9559', 'collides', 'fifteen', 'suburban', 'street-level', 'ambulance', 'pylons', 'a.m', 'derailed', 'rear', 'overturned', 'spilling', 'careered', 'bell', 'remarkably', 'nasty', 'gunman', '1996-08-27', 'hunted', 'shore', 'sergeant', 'pearson', 'fagan', 'telephoned', 'distraught', 'cooperating', 'northcote', 'sheds', '16-year-old', 'onlookers', 'disarm', '473-4746', 'fugitive', 'gun', 'unsuccessful', 'disturbed', 'simex', 'brent', 'ipe', 'u.k.', 'petroleum', 'contracts', 'mutually', '+65', '870', '3081', 'slides', '3.31', 's$', '5.85', '0120', '357,000', 'topped', 'soaring', '1.55', '6.05', 'takeover', '8703080', 'operators', '2,342.0', '42.5', '0915', 'ample', 'liquidity', '2,342.00', '42.45', '2,341.5', '42.0', 'respectively', 'deposed', 'pdi', 'sued', 'ousting', 'adjourned', 'out-of-court', 'lawyers', 'discussing', 'diminish', '0.45', '18.0', '18.5', '34.0', '35.0', '52.75', '53.50', '107.0', '2,337', '2,455', 'arlen', 'specter', 'resign', 'riyadh', 'oman', 'dhahran', 'airmen', 'abdullah', 'jeddah', 'shake-up', 'pentagon', 'pennsylvania', 'freeh', 'entirely', 'airways', 'refuelling', 'airbus', 'refuelled', 
'surrender', 'asylum', 'dozens', 'u.s.-brokered', 'cooperate', 'offensive', 'dividing', 'warring', 'salahuddin', 'rawandouz', 'indiscriminately', 'dayana', 'priest', 'protected', 'moussa', 'consequences', 'ransacks', 'bedouin', 'al-muntar', 'ransacked', 'encampment', 'expel', 'expansion', 'necklace', 'daughter-in-law', 'rummaging', 'luggage', 'destroying', 'shacks', 'barns', 'jeeps', 'shack', 'amina', 'miracle', 'bedouins', 'encamped', 'zone', 'lerner', 'pursuing', 'desolate', 'premiums', 'comex', 'works', 'aluminum', 'grade', '3.25-3.75', 'a7e', 'a0', 'nominal', '2.00-2.25', 'shg', '5.50-6.00', '3.50-4.00', 'tin', '6.5-8.5', 'ppm', '9.0-10.5', 'nickel', 'melting', '9.0-12.0', 'cathode', '2.50-3.0', 'alloy', 'a380', 'midwest', '65-66', 'turnings', 'low-copper', 'clips', 'no2', 'refined', 'no1', 'bare', 'burnt', 'batteries', '6.0', 'producer', 'transaction', 'alcan', 'p1020', 'ingot', 'extrusion', 'billet', 'noranda', 'date:august', 'rsr', 'pure', 'doe', 'asarco', '859', '1646', 'fort', 'lauderdale', 'fla.', 'backyard', 'nervous', 'teasing', 'parkway', 'younger', 'bedtime', 'tree', 'paramedics', 'broward', 'sheriff', 'stool', 'flashlight', 'cbot', 'bounce', 'oversold', 'remains', '450', 'cwt', '10.28', '312-408-8721', 'talbott', 'strobe', 'second-ranking', 'georgy', 'mamedov', 'pattern', 'calendar', 'fairly', 'haiti', 'hog', '1.50', 'sparked', 'packers', 'iowa', '59.50', '60.00', 'illinois', 'matching', '59.00', '57.50', '58.00', 'hogs', 'marketings', 'ship', 'prepares', 'janis', '312-983-7347--', 'gore', 'presents', 'posner', 'mild-mannered', 'meek', 'front-line', 'newt', 'gingrich', 'renominate', 'anxiously', 'thrusting', 'grip', 'scream', 'wishful', 're-election', '15-hour', 'marshal', 'pro-israel', 'stiff', 'transformed', 'energetic', 'gesturing', 'pol', 'ripped', 'favorite', 'foil', 'roaring', 'personifaction', 'evil', 'mentioning', 'housing', 'kemp', 'ignorance', 'audacity', 'two-headed', 'monster', 'whoops', 'downtown', '48-year-old', 'taste', 'nominations', 
'painted', 'horrors', 'republicans', 'liberties', 'withering', 'vine', 'polluters', 'productive', 'vision', 'builds', 're-elect', 'deja-voodoo', 'warmed-over', 'ditch', 'ridiculed', 'defense', 'praised', 'courage', 'regulations', 'dairy', 'comparison', 'tolerate', 'aloft', 'inflated', 'vetoing', 'repeal', 'criticized', 'slashing', 'starker', 'reeve', 'mix', 'adversity', 'latter', 'advocate', 'politicians', 'rep', 'gephardt', 'daschle', 'thumbnail', 'profiles', 'speakers', 'reagan', 'passage', 'handgun', 'campaigned', 'nonstop', '1981', 'requires', 'mandatory', 'five-day', 'handguns', 'mandates', 'background', 'checks', 'would-be', 'purchasers', 'hinckley', 'brain', 'congressmen', 'comic', 'hero', 'superman', 'movies', 'heroics', 'accomplished', 'horses', 'shattered', 'neck', 'vertebrae', 'equestrian', 'culpepper', 'paralyzed', 'extensive', 'fuse', 'spine', 'semi-upright', 'classically', 'prototypical', 'handsome', 'performed', 'soap', 'operas', 'plucked', 'sequels', 'mr', 'ambitions', 'milkman', 'consummate', 'congressional', 'insider', 'sufficiently', 'legislature', 'often-unruly', 'republican-led', 'republican-written', 'advocated', 'deficits', 'abortion', 'red-haired', 'square-jawed', 'fiery', 'orator', 'nomination', 'recreated', 'firebreathing', 'reformer', 'dakota', 'surprisingly', 'presented', 'moderate', 'steamrollered', 'vastly', 'dispelled', 'outmaneuvering', 'scrapping', 'gas', 'prairie', 'legislation', 'protecting', 'compensating', 'sickened', 'agent', 'orange', 'defoliant', 'spraying', 'vietnam', 'healthcare', 'water-carrier', 'republican-initiated', 'adult', 'adoptive', 'dallas', 'mccullough', 'gunshot', 'oklahoma', 'shotgun', 'arguments', 'recomposed', 'karachi', 'kse', 'kse-100', 'capitalisation', '82.3', '79.9', '9221-5685192', 'nwe', 'dulls', 'becalmed', 'repsol', 'puertollano', 'refinery', 'functioning', 'manuel', 'prieto', 'gasoline', 'notionally', 'sagging', 'nymex', 'arbitrage', 'eurograde', 'barges', '207', 'fob', 'ara', 'amsterdam-rotterdam', 
'sentiment', 'outright', 'heating', '400,000', '0-50', 'bearish', 'listless', 'bids', 'scarce', 'shaxson', '8167', 'prairies', 'frost', 'winnipeg', 'anywhere', 'grainbelt', 'alberta', 'meteorologist', 'gerald', 'machnee', 'sprague', 'manitoba', '39.2', '2.0', '5.0', 'windspeed', 'sky', 'moisture', 'freezing', '32.0', 'battleford', 'sask', '41.0', 'grande', 'alta', '44.6', 'proponents', 'moon', '12.0', '30.0', 'gras', '204', '947', '3548', 'brush', 'beryllium', 'lawsuits', 'pro-active', 'workplace', 'ailment', 'affects', 'immune', 'susceptible', 'remaining', 'suits', 'liability', 'typically', 'covered', 'timothy', 'reid', 'filings', '1990-95', 'vigorously', '18-7/8', '216-579-0077', 'salomon', 'refiner', 'q3', 'ting', 'refiners', 'refining', 'margins', 'third-quarter', 'diamond', 'shamrock', '0.38', '0.73', 'versus', '0.63', '0.85', 'tosco', '0.95', '1.03', '0.94', '0.46', '0.33', 'valero', 'energy', '0.27', 'presale', 'marion', '3,250,000', '09/04/96', 'nyc', '1200', 'cusip', '569399', 'wv', 'stat:exempt-ult', 'sp', 'na', 'y', 'enhancements', 'qual', 'dtd', '09/01/96', '5/1/98-02', 'sr', 'mgr', 'cpn', '05/01/97', 'non-callable', 'nic', '9/17/96', 'approx', 'wesbanco', 'fairmont', 'l.o.', 'steptoe', 'clarksburg', 'ferris', 'watts', 'charleston', '7,330,000', 'mbia', '3/1/90', '@', '6.14900', '4yrs', '4mos', 'avg', 'bbi-7.27', '575,000', '610,000', '650,000', '685,000', '730,000', 'pre-sale', 'contributed', 'j.j.', 'k-sheets', 'refunding', '290,000', 're', '70,375,000', 'facilities', 'repricing', '9,215,000.00', 'ocasek', 'a1', 'aa-', 'fitch', '08/29/1996', '10/01', '1998c', '125m', '4.20', '6,045,000.00', 'vern', 'riffe', '1998d', '165m', '290m', 'a.g.', 'banc', 's.b.k-', 'seasongood', 'mayer', 'chillicothe', 'shielded', 'whistlestop', 'rode', 'rails', 'ropelines', 'shaking', 'excited', 'hillary', 'rodham', 'huntington', 'rigorous', 'sidwell', 'renominated', 'lady', 'interested', 'drifted', 'depressed', 'aex', '4.54', '556.19', 'topping', '1.90', '58.70', 'ihc', 
'caland', '2.40', '80.70', '34.9', '36.6', '37.5', '47.2', 'ex-dividend', '0.60', '52.90', 'nutricia', 'shrugged', 'ex-div', 'soar', '4.10', '214.40', '18.40', '210.00', 'stork', 'follow-through', 'fokker', 'short-lived', '51.00', 'tapie', 'claude', 'lelouche', 'stars', 'philippe', 'seguin', 'resigning', 'eject', 'bankrupt', 'thus', 'ineligible', 'blizzard', 'now-destroyed', 'starring', 'homme', 'femmes', 'mode', \"d'emploi\", 'instructions', 'power-hungry', 'cruel', 'comedy', 'dearly', 'mixing', 'careers', 'artist', 'toubon', 'ejecting', 'stripping', 'procedure', 'reconvene', 'suspend', 'judgement', 'immunity', 'courts', 'rigging', 'appealing', 'drains', 'ffr', 'drained', 'francs', 'repurchase', 'allocate', '44.3', '48.2', '13.4', 'bidders', 'collateral', 'satisfying', '3.4', 'allotted', '30.9', 'rabobank', 'rabn.cn', 'h2', 'co-operative', 'ba', 'herman', 'wijffels', '853', '21.5', '702', 'depend', 'easing', 'underwriting', 'single-digits', '1.43', 'quantify', 'garry', 'ipsos', 'sympathises', 'permits', 'cold-hearted', 'sncf', 'renegotiation', 'bailout', 'upturn', 'atria', 'foodstuffs', 'oy', 'year-half', 'january-june', 'appropriations', 'bright-belgians', 'speeding', 'epidemic', 'belga', 'checked', 'amd', 'booked', 'm.p.h.', 'no-confidence', 'debate', 'banharn', 'silpa-archa', 'lacking', 'ethical', 'alleges', 'corrupt', 'accusations', 'convenient', 'accusation', '13-month-old', 'six-party', '209', 'seats', '391-seat', 'infighting', 'chart', 'fix', 'fontaine', '6mth', '3.17', '231', 'fashion', 'wigs', 'coconut', 'associations', 'philippines', 'cif', 'prev', 'julaug', '775', '787.50', 'unq', 'augsep', '752.50', '758.75', 'sepoct', '733.75', '743.50', 'octnov', '740', 'novdec', '732.50', 'aronkasei', 'nomura', 'downgraded', 'three-grade', 'assigns', 'direction', '225-share', 'presse', 'langage', 'temps', 'beja', 'ekeus', 'unscom', 'oficials', 'tareq', 'aziz', 'inspectors', 'shuttled', 'detection', 'disarming', 'destruction', 'prerequisite', 'crippling', 'invading', 
'ticket', 'altogether', 'weaken', 'harb', 'omar', 'karame', 'backwards', 'redistribution', 'locations', 'occupied', 'alimentary', 'splitting', 'syrian-lebanese', 'maltese', 'cheating', 'complain', 'over-charging', 'in-nazzjon', 'discipline', '365,000', '195,000', '80,000', 'congested', 'l-orizzont', 'alfred', 'sant', 'vat', 'tamils', 'demonstrate', 'demonstrated', 'nadarajah', 'muralidaran', 'swiss-based', 'tiger', 'extortion', 'ltte', 'eurobourses', 'recovers', 'santorelli', 'bourses', 'clawing', 'unsteady', 'uncertainty', 'tankan', 'three-day', '0.3', 'bargain-hunters', 'ftse', 'patchy', 'culminating', '3,911', 'fuelled', 'unsettled', 'stronger-than-expected', 'pulling', 'treasuries', 'relinquished', 'doldrum', 'ackerman', 'strategist', 'fahnestock', 'consequently', 'swings', 'floor', 'computerised', 'ibis', '0.4', 'chemical', 'fundamentals', 'fantasy', 'unease', 'franc', '3.4210', 'squeezed', 'jitters', 'malaise', 'regain', 'evaporate', '0.5', 'pressured', 'currencies', 'emu', '1.4788', '107.74', '1.4789', '107.55', 'times-stock', '3,905.7', '2.43', '2,017.99', '30-share', 'dax', '6.48', '2,558.84', 'precious', '388.55', '388.75', '5.24', 'stansted', 'iraqis', 'diverted', 'british-based', 'sadiki', 'trace', 'contacted', 'north-east', 'explosives', 'batches', 'jordanians', 'saudis', 'eco', 'builders', 'edna', 'fernandes', 'ecological', 'warfare', 'corporates', 'hurts', 'eco-terrorism', 'tarmac', 'costain', 'conglomerate', 'targeted', 'activist', 'harmless', 'ragbag', 'hippies', 'harding', 'aggregates', 'mobile', 'phones', 'communicate', 'gather', 'demos', 'protestor', 'codename', 'full-scale', 'emphasise', 'terror', 'newbury', 'bypass', 'intimidation', 'picketing', 'underground', 'cryptic', 'elves', 'leaflets', 'larger', 'earth', 'ours', 'm3', 'twyford', 'campaigning', 'broader', 'stopping', 'out-of-town', 'pollution', 'road-building', 'primarily', 'tendering', 'realise', 'environmental', '3-4', 'forms', 'tangible', 'intangible', 'publicity', 'protesting', 
'tales', 'tenders', 'contractors', 'suppliers', 'quarries', 'supplier', 'protestors', 'invade', 'knock-on', 'investement', 'ubs', 'phenomenon', 'evaluates', 'methods', 'involve', 'wide', 'razor-thin', 'overcapacity', 'stagnant', 'tale', 'woe', 'carnival', 'spirits', 'notting', 'revellers', 'singing', 'dancing', 'stabbings', 'ugly', 'scenes', 'scar', 'festival', 'festivities', 'good-natured', '1976', 'darker', 'slowly', 'recovering', 'shopkeepers', '248', 'annex', '2.9', 'fake', 'sudradjat', 'djiwandono', '5.4', '43-year', '2,341', 'divided', 'cart', 'olazabal', 'seve', 'ballesteros', 'motorised', 'rheumatoid', 'pairs', 'decides', 'ryder', 'commitee', 'unhelpful', 'precedent', 'olly', 'dispensations', 'feasible', 'carts', 'prohibited', 'warzycha', '46th', 'kostas', 'malekos', 'resigns', 'kirkcaldy', 'managerial', 'casualty', 'resigned', 'directors', 'relinquish', 'regrettably', 'accordingly', 'pride', 'intact', 'agreeing', 'griqualand', 'kimberley', '18-18', '6-10', 'maltch', 'cloete', 'wath', 'boeta', 'wessels', 'mcleod', 'glen', 'osborne', 'halford', 'endeavours', 'whilst', 'divisionn', 'three-match', 'outs', '396', '79.20', '59.33', '190', '113', '38.00', 'nasser', '37.00', '32.40', '159', '31.80', '41no', '25.50', 'ealham', '11.60', '10no', '9.75', '6.00', 'caddick', 'graeme', 'hick', 'maidens', '57.2', '165', '27.50', '36.16', '150.3', '377', '37.70', '42.00', '47.4', '62.50', '69.00', '81.00', '61.2', '221', '110.50', '264', '264.00', '158', '79.00', '141', '68.80', '195', '100no', '65.00', '320', '148', '64.00', '60.33', 'latif', '45.00', '38.50', '30.00', '24.50', 'shadab', 'kabir', '21.75', 'ata-ur-rehman', '26.29', '26.93', '31.81', '48.4', '173', '34.60', '71.00', 'underlined', 'consistency', 'keith', 'fletcher', '29,434', 'selector', '1,429', '64.95', 'no-one', 'argue', 'appreciate', 'headbutt', 'miron', 'cozma', 'headbutting', 'bosses', 'miners', 'lei', '3000', 'danut', 'lupu', 'rioted', 'reformist', 'petre', 'petrosan', 'tunnel', 'skirmish', 'tall', 
'tallest', 'towering', 'cms', 'squash', 'jansher', 'pakistnn', 'brett', '14-17', '13-15', 'cairns', 'del', 'harris', '7-15', 'chaloner', 'frenz', '12-15', '15-4', '15-14', 'kneipp', 'faizy', 'mir', 'zaman', 'gul', 'meads', 'thoren', '8-15', 'extends', 'topples', 'champ', 'vintage', 'toppling', 'illustrious', 'serve-and-volley', '30-year-old', 'retire', 'volleyed', 'grace', 'jimy', 'szymanski', 'sprained', 'romp', 'pavel', 'fellow-american', 'wiesner', 'iva', 'majoli', 'fifth-', 'sidelines', 'rita', 'alexia', 'dechaume-balleret', 'ellwood', 'mariaan', 'swardt', 'dominique', 'roost', 'florencia', 'labat', 'rinaldi', 'stunkel', 'angelica', 'gavaldon', 'paola', 'suarez', 'marianne', 'werdel', 'witmeyer', 'grossman', 'silvia', 'farina', 'caldwell', '5-', 'adriana', 'serra-zanetti', 'wagner', 'gigi', 'kristie', 'boogert', 'joannette', 'laxmi', 'poruri', 'filippo', 'veglio', 'ruud', 'jabali', 'campana', '4-', '17-', 'radka', 'bobkova', 'kschwendt', 'kleinova', 'annabel', 'capriati', 'arendt', 'cacic', 'likhovtseva', 'kyoko', 'nagatsuka', '7-', 'pam', 'shriver', 'kimberly', 'po', 'ruano-pascual', 'tina', 'kirzan', 'rika', 'hiraki', 'langrova', 'tami', 'whitlinger', 'cecchini', 'francesca', 'lubiani', 'tamer', 'sawy', '7-9', 'amy', 'frazier', 'larisa', 'neiland', 'lisa', 'lori', 'mcneil', 'dopfer', 'zina', 'garrison', 'sawamatsu', 'rennae', 'stubbs', 'miriam', 'oremans', 'zrubakova', 'pozzi', 'skoch', '.508', '.595', '.526', '.402', '.492', '.434', 'vanlandingham', 'glenallen', 'first-inning', '8-13', 'concentrated', 'andres', 'galarraga', 'extra-base', 'rain-shortened', 'seven-inning', 'arthroscopic', 'benes', 'royce', 'clayton', '14-9', 'one-half', '12-11', 'art', 'howe', 'intentionally', 'lined', 'elbow', '20-6', 'eldred', '5-1/3', 'miranda', 'batter', 'thome', 'nagy', 'three-hitter', 'felipe', 'left-field', '29th', 'joe', '10-game', 'enjoying', '186th-ranked', 'tiebreaker', 'hottest', '16-2', 'hardcourts', 'nerves', 'talented', 'hurried', 'stomach', 'week-old', 'sushi', 
'combination', 'undone', 'revenge', 'breezy', 'erratic', 'untidy', 'unforced', 'walloped', 'woeful', 'faults', 'deflating', 'fault', 'confusion', 'awarded', 'umpire', 'barely', 'frittered', 'risen', 'stray', 'spate', 'withdrawals', 'lacklustre', 'trail', 'recruits', 'fluidity', 'proved', 'parries', 'lie', 'riedle', 'tretschok', '77th', 'decheiver', '48,800', 'balakov', 'hagner', '85th', '31,139', 'schulz', '24,800', 'donkow', '33,230', 'jeffrey', 'roest', 'korneev', 'hansma', 'hockey', 'ville', 'peltonen', 'ylonen', 'teemu', 'selanne', 'jyrki', 'lumme', 'janne', 'ojanen', '23rd', 'ruuttu', 'radek', 'bonk', 'reichel', 'dopita', 'cyprien', 'nine-month', 'xamax', 'jean-pierre', 'post-match', '8,400', 'punches', 'claudio', 'moura', 'intervene', 'succeeded', 'kneeing', 'hegi', 'elbowed', '840', 'facchinetti', 'astonished', 'gress', 'shocking', 'verbally', 'provoked', 'punished', 'scuffle', 'punch', 'react', 'bugno', 'doping', 'gianni', 'testing', 'testosterone', 'hormone', 'subsequent', 'higher-than-average', 'naturally', 'giro', \"d'italia\", 'stimulant', 'caffeine', 'colonna', 'haarlem', 'kilometre', 'gouda', 'federico', 'mapei', 'mins', 'secs', 'robbie', 'mcewen', 'jans', 'koerts', 'palmans', 'teutenberg', 'postal', 'steels', 'endrio', 'leoni', 'aki', 'capiot', 'collstrop', 'braber', 'neths', 'blijlevens', 'tvm', 'wolf', 'foreldorado', '0:04', '0:06', 'corini', '0:07', 'omloop', 'motorola', '0:08', 'tristan', 'hoffman', 'hincapie', '0:09', 'talen', '0:10', 'cofinec', 'slips', 'emese', 'bartha', 's.a.', 'rebound', 'gabor', 'sitanyi', 'london-based', 'barings', 'french-registered', 'floated', 'hovered', '6,425', 'forints', 'depositary', 'receipts', 'oversubscribed', 'deadline', '5,800', 'one-third', 'two-fifths', 'tamas', 'erdei', 'budapest-based', 'abn-amro', 'hoare', 'govett', 'macroeconomic', 'generates', 'plunged', 'understands', 'capita', 'consumption', 'folding', 'krpaco', 'ownership', 'pse', 'czk', '000', 'agrotonz', 'tlumacov', '336.47', '59440', '19999.777', 
'avia', '290.00', '700', '203.000', 'barum', '171.00', '14432', '2467.872', 'ceska', 'sporitelna', '335.00', '375.00', '533153', '198354.941', 'ckd', '369.66', '384.00', '5565', '2065.260', 'emkam', '34684', '867.100', 'kablo', 'kladno', '960.00', '2230', '2140.800', 'komercni', 'banka', '2320.00', '2370.00', '7000', '16408.700', 'leciva', '2470.00', '1360', '3359.200', 'metrostav', '3024.95', '9074.850', 'morav.chemic.', 'zav', '637.50', '1626', '1036.575', 'okd', '111.50', '112.56', '95975', '10752.092', 'pf', 'iks', 'kb', '156.00', '6000', '936.000', 'rif', '900.00', '5500', '4950.000', 'seliko', '4000.00', '20000.00', '3565', '32607.500', 'sokolovska', 'uhelna', '785.00', '4710.000', 'spif', 'cesky', '339.00', '340.00', '7546', '2562.094', 'spt', '3355.00', '3404.71', '10700', '36337.137', 'skoda', '1045.56', '1060.00', '10772', '11361.330', 'tabak', '6700.00', '6700.000', 'trinecke', 'zelezarny', '630.000', 'vodni', 'stavby', '1915.00', '3830.000', 'slows', 'after-hours', 'worldcom', 'mfs', '1-3/4', '3-8/16', '41-5/16', '5,700', '53,400', '4,153,800', 'cboe', 'valued', 'suggest', 'unusual', 'certainly', 'steadily', 'mid-august', 'derivatives', '312', '408-8750', 'e-mail', 'derivatives@reuters.com', 'faulding', 'patent', 'elizabeth', 'n.j.', 'purdue', 'frederick', 'infringement', 'purepac', 'pharamceutical', 'kadian', 'sustained', 'morphine', 'merit', 'zeneca', 'f.h.', 'mick', '36-year-old', 'first-team', 'omitted', '20-man', 'kernaghan', 'daish', 'kelly', 'elland', 'experimental', 'shay', 'denis', 'irwin', 'babb', 'kenna', 'breen', 'harte', 'cunningham', 'staunton', 'townsend', 'houghton', 'gareth', 'farrelly', 'mcloughlin', 'mcateer', 'cascarino', 'niall', 'quinn', '+6613377', 'killer', 'murders', 'eugene', 'colonel', 'commanded', 'wiped', 'smerdon', 'nuns', 'garang', 'spla', 'urgently', 'nuour', 'marial', 'mapourdit', 'hindering', 'recruitment', 'interpretation', 'compound', 'sisters', 'moira', 'batchelor', 'barton', 'riel', 'sister', 'maureen', 'carey', 
'raniero', 'iacomella', 'captives', 'kenyan', 'attributed', 'detentions', 'learned', 'monsignor', 'caesar', 'mazzolari', 'apostolic', 'diocese', 'rumbek', 'isolation', 'looted', 'animist', 'arabised', 'postpones', 'pressed', 'register', 'well-organised', 'coerce', 'inform', 'districts', 'conquered', 'ethnically', 'cleansed', 'hinted', 'flagrant', 'fo', 'administer', 'waits', 'kuznets', 'finalising', 'arranged', 'vyacheslav', 'tikhomirov', 'materialise', 'rebuffed', 'suggestion', 'band', '10.45', '0645', 'guldimann', 'tikhomirov-maskhadov', '20-month-old', 'falter', 'ria', 'indicated', 'agencies', 'hinting', 'protege', 'lesson', 'profile', 'reelected', 'prompting', 'rumoured', 'weakening', 'aides', 'insisting', 'apart', 'spelled', 'intensify', 'reinforced', 'determination', 'aleksander', 'kwasniewski', 'kucan', 'strengthening', 'bloc', 'comprises', '142.3', '118.8', 'janez', 'drnovsek', 'nationalists', 'iliescu', 'impeachment', 'ion', 'punr', 'electioneering', 'pdsr', 'nastase', 'unexpectedly', 'admission', 'vexed', 'ministries', 'gheorghe', 'funar', 'impeached', 'treason', 'compromising', 'oust', 'succeed', 'oppose', 'estonian', 'mps', 'electing', 'belinda', 'goldsmith', 'tallinn', 'lennart', 'meri', 'pushing', 'oversaw', 'statehood', 'arch-rival', 'ruutel', 'votes', '101-member', 'garnered', 'reconvened', 'ceded', 'favoured', 'heiki', 'kranich', 'constitution', 'smoothe', 'periods', 'parliamentarians', 'leftist-led', 'inched', 'constant', 'convene', '101', '273', 'emerges', 'garner', 'enn', 'markvart', 'invalid', 'abstentions', 'convened', 'abusing', 'shameful', 'acts', 'adnan', 'xhelili', 'wiltshire', 'adriatic', 'durres', 'divorced', 'befriended', 'reminded', 'heterosexual', 'homosexual', 'begging', 'impoverished', '1300', 'popularity', 'laca', 'sensational', 'difficulty', 'filmed', 'rudolf', 'gajdos', 'interpol', 'eva', 'boudova', 'interrogated', 'pornographic', 'films', 'suspicions', 'rape', 'detectives', 'disappearances', 'serial', 'urals', 'perm', 'raped', 
'identify', 'waited', 'touches', 'reminds', 'commandments', 'posters', 'offices', 'quarracino', 'sermon', 'cleric', 'biblical', 'commandment', 'thou', 'shalt', 'free-market', 'eletropaulo', 'eduardo', 'bernini', 'sobral', 'secretariat', 'romina', 'nicaretta', '5511', '232', '4411', 'victims', 'alvarado', 'hurte', 'sierd', 'zylstra', 'jetsi', 'hendrika', 'coers', 'teak', 'plantation', 'schutte', 'aspect', 'hand-written', 'ebe', 'huizinga', 'abductors', 'cvg', 'privatization', 'caracas', 'swell', 'corporacion', 'venezolana', 'guayana', 'proceeding', 'machuca', 'sidor', 'union-based', 'steel-producing', 'venalum', 'alucasa', '13,000', 'layoffs', 'unionized', 'lugo', '582', '834405', 'drunks', 'lovebite', 'bandit', 'drinkers', 'lovebites', 'drunken', 'stupor', 'dreaded', 'chupabolos', 'drunksucker', 'preys', 'matagalpa', 'placing', 'hickey-like', 'nuevo', 'diario', 'enraged', 'machismo', 'so-far', 'culprit', 'surrounding', 'vagrants', 'slept', 'gripping', 'desserts', 'bolos', 'drunkards', 'beautiful', 'banespa', 'prior', 'globo', 'liquidated', 'temporary', 'restructure', 'privatized', 'refinance', 'covas', 'reais', 'delicate', 'solved', 'bamerindus', '90-day', 'tbc', 'loan', 'fourth-largest', 'troubles', '55-11-2324411', 'havel', 'vaclav', '15-21', 'henrique', 'cardoso', 'cities', 'manaus', 'chancellor', 'benevolent', 'alejandro', 'lanusse', '1971', '1973', 'domingo', 'peron', 'predecessors', 'ongania', 'levingston', 'steered', 'peronists', 'hector', 'campora', 'solano', 'adversories', 'imprisoned', '1951', 'coup', 'menendez', 'gradual', 'left-wing', 'activism', 'culminated', 'autobiography', '1918', 'married', 'ileana', '1935', 'collision', 'liner', 'liaoning', 'tiantan', 'dalian', 'tianjin', 'matahari', 'revises', 'putra', 'prima', 'hanifah', 'komala', '+6221', '384-6364', 'china-bound', 'ki-choo', 'jiaxuan', 'atheist', 'nominally', 'teachers', 'remote', 'attract', 'nabs', '10-year-old', 'immigrant', 'sneaked', 'jiangsu', 'passerby', 'apartment', 'immigrants', 
'overstayed', 'mainland', 'reverts', 'hasan', 'muratovic', 'bosnians', 'suleyman', 'demirel', 'tansu', 'ciller', 'barkho', 'organising', 'secretary-', 'gualtiero', 'fulcheri', 'zejjari', 'ascertain', 'equitable', 'procured', 'u.n', 'employ', 'iraq-u.n.', 'memorandum', 'understanding', 'partial', 'separating', '1960', 'somalia', 'dodge', 'steers', 'heifers', '4,200', 'contracted', 'formulated', '408', '8720--', 'anti-abortion', 'praises', 'democrat', 'tolerance', 'elsner', 'pro-abortion', 'views', 'hall', 'conscience', 'recognizes', 'welcomes', 'divergent', 'inclusiveness', 'organizers', 'casey', 'vehement', 'intolerance', 'pro-woman', 'pro-child', 'pro-life', 'deliver', 'podium', 'deaf', 'ears', 'abortions', 'dilemma', 'insert', 'recognizing', 'validity', 'passionate', 'kate', 'michelman', 'disdain', 'punishment', 'cynthia', 'mckinney', 'flooded', 'montana', 'bushel', 'noteworty', 'durum', 'jumping', '14-pct', 'protein', 'wheats', 'chg', '5.06', '.02', 'unc', 'duluth', '---', 'hunter', '4.46', 'dn', '5.00', 'hrw', '12pct', 'billings', 'mt', '4.62', '.01', '.10', 'rudyard', '4.41', 'portland', '5.1700', 'pendleton', '4.7300', 'coolee', '5.13', '4.7000', 'waterville', '5.05', '4.6200', 'wenatchee', '5.15', '4.7200', 'nc=acomparison', 'na=not', '312-408-8720', 'vmig-1', '08/23/96', 'rec', 'bd', 'ref', 'ymca', 'proj', 'ser', 'vmig', '3,390,000', '08/28/96', 'lauds', 'troop', 'welcome', 'dialogue', 'mashadov', 'single-a', '08/26/96', 'oh', '6,310,000', 'stallone', 'fiancee', 'sylvester', 'flavin', 'publicist', '7-pound', '4-ounce', 'sophia', 'bloch', 'wonderful', 'rambo', 'copland', 'jumps', 'abc', 'challenger', 'stretching', 'whistle-stop', 'perot', '47-38', '1,002', '824', 'opting', '48-43', 'fulfil', '26-57', 'bulk', 'millfeeds', 'millfeed', 'high-priced', 'flour', 'mixer', 'ton', 'barley', '140', 'mixers', 'closely-watched', '312-408-8720--', 'puerto', 'rico', 'hairy', 'surgical', 'dark-brown', 'patch', 'skin', 'abyss', 'dejesus', 'nevus', 'journals', 'ostracism', 
'gradually', 'expanding', 'transplanting', 'afflicted', 'norris', 'balloons', 'forehead', 'shoulders', 'filling', 'saline', 'inserted', 'treatments', 'eau', 'claire', 'wisc', 'baird', 'waterworks', '5.2893', 'realtors', '4,464', 'single-family', '4,570', '206,464', 'condominium', '24.8', 'condos', 'nudged', '1.0', '123,394', '8.25', '8.32', '7.03', '617-367-4106', 'amtrak', 'derails', 'montpelier', 'vt', 'vermonter', 'albans', 'vermont', 'd.c.', '7:51', 'roxbury', 'garrity', 'pudvah', 'trauma', 'understood', 'conductor', 'passangers', 'reservations', 'uninjured', 'springfield', 'northfield', 'paralympics', 'gloomy', 'france-juppe', 'handicapped', 'paralympic', 'gloom-stricken', 'scepticism', 'opposite', 'july-august', 'medals', 'pessimistic', 'stagnates', 'unemployement', 'near-record', 'blue-chip', 'foray', 'sbf-120', '1.19', '1,421.90', 'actively', 'cfdt', '500,000', 'syndicale', 'unitaire', 'fsu', 'austerity', 'unveiled', 'anxieties', 'niggled', 'centime', '3.4211', 'heavyweights', 'elf', 'rhone', 'poulenc', 'eurotunnel', 'morose', 'post-holiday', 'uic', 'gan', 'slid', '12.19', '55.1', '758', 'recapitalisation', 'carrefour', '2.19', '2,616', 'cheuvreux', 'virieu', 'reinsurance', 'scor', 'prudential', 'mercantile', 'bollore', '2.4', '73.83', 'scac', 'delmas', 'vileujeux', 'sdv', 'alcatel', 'alsthom', '395.0', 'opthalmic', 'essilor', '1,328', 'oakley', 'non-prescription', 'gentext', 'optics', 'veerakesari', 'telo', 'trincomalee', 'chavakachcheri', 'jaffna', 'sentries', 'thinakaran', 'tulf', 'sivasiththamparam', 'meaningless', 'unp', 'underpriviledged', 'sections', 'society', 'excise', 'w.n.f.', 'chandraratne', 'guidelines', 'liquor', 'licences', 'licence', 'lankadeepa', 'female', 'simultaneous', 'chandrika', 'kumaratunga', 'motorcade', 'divaina', 'cultural', 'sum', 'worn', 'dinamina', 'ruhunu', 'indefinitely', 'hospitalised', '941-434319', 'rupam', 'banerjee', 'tributes', 'legendary', 'poured', 'wean', 'laureate', 'aided', 'breathing', 'woodlands', 'vomiting', 
'diagnosed', 'abated', 'irregularly', 'breathes', 'advise', 'fingers', 'familiar', 'six-member', 'treating', 'greetings', 'bouquets', 'pope', 'get-well', 'placard', 'shishu', 'bhavan', 'speedy', 'recovery', 'poorest', 'prostitutes', 'goddess', 'raju', 'statesman', 'mangala', 'das', 'waist', 'prem', 'gift', 'incessantly', 'tarak', 'footpath', 'passers-by', 'immaculate', 'bless', 'scribble', 'prayed', 'bengal', 'religions', 'pray', 'solidarity', 'downtrodden', 'nanda', 'gopal', 'bhattacharya', 'rifkind', 'conferences', 'obey', 'normally', 'interfere', 'protested', 'salvation', 'fis', 'hamas', 'guest', 'denying', 'fundamentally', 'mongolia', 'congressman', 'sayed', 'masood', 'briefed', 'dana', 'rohrabacher', 'wartorn', 'appoint', 'transitional', 'bagram', 'airbase', 'amrollah', 'neutralise', 'afghans', 'hamid', 'ibrahimi', 'feels', 'neutral', 'jalalabad', '1.38', 'rupees', 'auctioned', 'three-', 'five-', '1.126', '44.5', '782.6', 'insurgents', 'sharma', 'centre-right', 'insurgency', 'maoists', 'multi-party', 'negotiates', 'khum', 'bahadur', 'khadga', 'insurgent', 'bhattarai', 'guarantee', 'centrist', 'jointly', 'marxist-leninist', 'uml', 'three-party', 'soy', 'indore', '12,900-13,100', 'soyoil', 'solvent', 'undertone', 'soymeal', '276-277', '246-248', 'rapeseed', 'extraction', 'availability', '3,850', 'bedibunder', '3,800-3,825', 'bhavnagar', '---------------------', 'dewas', '12,700-12,950', '12,900-13,150', '11,900-12,100', 'mandsaur', '12,600-12,750', '12,700-12,850', 'neemuch', 'n.a', 'mhow', '12,700-12,800', '12,750-12,850', 'ratlam', 'ashta', '12,700-12,900', '12,800-13,000', '12,750-12,950', 'dhar', '12,750-12,900', 'ujjain', '12,850-13,050', 'jaora', 'barnagar', 'khandwa', 'ashoknagar', 'nalkhera', '----------------------------------', '30,300-30,400', '30,700-30,800', '32,700-32,800', '32,900-33,000', '--------------------------------', 'rail-for', '9,800', '8,800', 'bedi', 'bunder', '1=35.73', 'humayun', 'rasheed', 'choudhury', 'callers', 'chaired', 
'bengali', 'banglabazar', 'patrika', '330-member', '1986-87', 'assemby', 'partisan', 'ineffective', 'resorting', 'instability', 'desireable', 'designs', 'sternly', 'm2', '8.2', '456.8', '439.9', '422.1', 'm1', '144.5', '139.3', '131.7', 'helibor', 'fixing', '3.40', '1-mth', '3.27', '3.29', '2-mth', '3.34', '3-mth', '6-mth', '3.56', '3.55', '9-mth', '3.73', '3.70', '12-mth', '3.89', '3.87', 'barrick', 'arequipa', '36.3', 'tendered', 'ahave', 'realize', 'munk', '30-a-share', 'attractive', 'pierina', 'allocation', 'swallow', 'vancouver-based', 'prospector', 'sweetened', 'batch', 'drill', 'ounces', 'drilling', 'pro-rated', 'penn', 'terminates', 'allentown', 'terminated', 'non-binding', 'merrion', 'licensing', 'license', 'domiciled', '212-859-1610', 'vnu', 'publisher', 'op', '618', '568', '363', '127', '174', 'info', 'miscellaneous', 'pro', 'rata', 'hmg', 'vtm', 'aol', 'online', 'hanover', 'bertelsmann', 'adon', 'schiphorst', 'cebit', 'buettner', 'managing', 'thirds', 'scandanavia', 'benelux', '0172', '6736510', 'hijack', 'eyewitnesses', 'rona', 'a310', '+', '00--44-171-542-7947', 'dtb-bund-future', 'tranches', '02.sep.96-06.mar.97', '95.35', '96.00', '1.16', '97.00', '2.50', '127.10', '98.00', '202.90', '94.00', '101.40', '95.0', '1.33', '1.80', '71.70', '96.0', '1.84', '1.20', '51.80', 'dbrs', 'confirms', 'ratings', 'pfd-2', 'debentures', 'cumulative', 'non-cumulative', 'aa', 'pfd-1', 'intercity', 'roadblock', 'provinces', 'erzincan', 'sivas', 'ablaze', 'confiscates', 'cyprus-based', 'arabic', 'al-tadamun', 'suggesting', 'editor-in-chief', 'liwaya', 'censors', 'expense', 'front-page', 'entitled', 'compliant', 'undergo', 'compulsory', 'psychiatrists', 'capacities', 'behave', 'zionists', 'censorship', 'ipo', 'transkaryotic', 'therapies', 'symbol', 'tktx', 'shrs', '16,668,560', 'underwriter', 'morgan', 'underwriters', 'over-allotment', '375,000', 'hoechst', 'roussel', '357,143', 'platforms', 'gene', 'activation', 'preclinical', '15,400', '2,074', '3,422', 'derailment', 
'praise', 'wheelchair', 'mrs.', 'controlling', 'firearm', 'bradys', 'cane', 'rousing', 'reception', 'sat', 'vip', 'felons', 'saluting', 'sportsman', 'remington', 'ak47', 'uzi', 'deserve', 'thumbs', 'deranged', 'impress', 'jodie', 'actress', 'tracking', 'cdu', 'csu', 'spd', 'fdp', 'pds', 'emnid', 'res', '11.0', 'allensbach', '37.2', '32.8', '13.0', '39.0', '40.0', '37.4', '7.3', '12.3', 'forsa', '36.0', '31.0', '43.0', '37.0', '38.5', '32.5', '8.1', '38.1', '32.3', '12.9', '6.3', '36.4', '6.9', 'forschungsgruppe', 'wahlen', '228', '2609760', 'grimwade', '4.30', '0330', 'requests', 'negotiators', 'suggestions', 'mentmore', 'resource', 'archive', 'housewares', 'formerly', 'platignum', 'articles', 'pence', '81.5', 'valuing', '179.5p', '4017', 'tnt', 'glafcos', 'xenos', 'heathrow', 'gatwick', 'handles', 'ruth', 'third-busiest', 'prefer', 'implementing', 'well-rehearsed', 'contingency', '0300', 'intend', 'refuel', 'identity', 'parrot', 'scam', 'perth', 'conman', 'parrots', 'dye', 'birds', 'denham', 'peiris', 'cinnamon', 'ringneck', '14,000', 'impostor', 'fooled', 'pet', 'unknowingly', \"'d\", 'photos', 'authentication', 'dyed', 'feather', 'bird', 'enthusiast', 'bogus', 'informant', 'colours', 'moult', 'motorist', 'tonga', 'unexpected', 'tauranga', 'pothole', 'spun', 'wheels', 'tyres', 'smoke', 'pouring', 'bonnet', 'drink-driving', 'iscovered', 'overstayer', \"nuku'alofa\", 'sbpus', 'seven-day', '14-day', 'cut-off-rate', '15.75', '16.00', '38.43', '218.50', 'embassies', 'missions', 'macedonian', 'korean-related', 'outlawed', 'reunification', 'crushed', 'urgent', 'disarmament-china', 'reaffirmed', 'totally', 'satisfy', 'balanced', 'commentary', 'committing', 'thwarting', 'muted', 'forwarding', 'compromised', 'discussed', 'completion', 'inspections', 'drafts', 'stubbornly', 'uphold', 'deterrence', 'self-imposed', 'moratorium', 'declares', 'poisoning', 'receding', 'mysterious', 'germ', 'sakai', 'hardest', 'o-157', 'bacillus', 'settling', 'naoto', 'kan', '9,500', 'regional', 
'osaka', 'deadly', 'bacteria', 'schoolchildren', 'complications', 'indicating', 'peak', 'relieved', 'infected', 'pinpoint', 'infection', 'sanitary', 'standards', 'slaughterhouses', 'meatpacking', 'overhaul', 'compile', 'hygiene', 'aluminium', 'shipments', '8.9', 'mill', '224,609', '222,457', 'beverage', 'reflecting', 'above-average', 'cooler', 'inventories', '75,632', '0.2', '11,525', '11,244', 'downward', '210,622', '210,683', 'upward', '213,989', '213,845', 'pegged', '40,144', 'auto', '15,286', '79,390', 'dipped', '18,867', '81-3', '3432', '6179', 'publicly', 'gratitude', 'bongo', 'thanking', 'technological', 'quashed', 'expressing', 'freedoms', 'drafted', 'censure', 'forum', 'code', 'dissent', 'doomed', '0.05', '7.35', 'three-month-to-three-year', 'sheu', 'yuan-dong', 'jumpstart', 'sluggish', 'half-percentage', 'reductions', '5080815', 'demolition', 'two-hour', 'demolished', 'metre', 'crane', 'bulldozer', 'walls', 'amidst', 'alleys', 'bystanders', 'bulldozed', 'plo-israel', 'lawmaker', 'hashem', 'zighayer', 'closure', 'palestine', 'annexed', 'cede', 'sec', 'adopts', '1996-08-28', 'specialists', 'quotes', 'electronic', 'readily', 'individuals', 'orderly', 'empower', 'compete', 'levitt', 'lindsey', 'improvements', 'commonplace', 'practices', 'existed', 'two-tiered', 'quote', 'robbing', 'malpractices', 'oversight', 'shifts', 'continuous', 'quotations', 'display', 'berkeley', 'reprieve', 'mogul', 'silvio', 'berlusconi', 'mediaset', 'extending', 'plugs', 'void', 'proprietor', 'channels', 'locomotive', 'stationary', 'steyr', 'shunt', 'wagons', 'sidings', 'trapped', 'wreckage', 'treat', 'averted', 'brakes', 'railways', 'apa', 'saskatchewan', 'eyes', 'forge', 'scope', 'pork', 'positioned', 'loewen', 'swp', 'analyzing', 'partnerships', 'subsidy', 'grains', 'shipped', 'integrated', 'units', 'contracting', 'programs', 'monopoly', 'rovereto', 'ninova', '6.72', 'heike', 'drechsler', '6.65', 'fiona', '6.64', '13.42', '13.45', 'giaconi', '13.80', '11.34', '11.53', 'gabi', 
'rokmeier', 'sergey', 'makarov', '85.26', '84.20', '81.64', '10.13', '10.18', 'tilli', '10.43', '45.15', 'vaccari', '46.16', 'ochieng', '46.21', 'mariacarla', 'bresciani', '3.85', 'nastja', 'rysich', 'ana', 'fidelia', 'quirot', '58.98', 'letitia', 'vriesde', '2:00.39', '2:00.91', 'kreissig', '2.20', 'kostantin', 'matusevitch', 'buiatti', '2.15', 'kibet', '1:45.24', '1:45.62', 'kibitok', '1:46.09', 'oksana', 'ovchinnikova', '58.94', 'shikolenko', '57.44', '56.70', 'virna', 'angeli', '55.66', 'torshina', '55.99', 'knoroz', '57.02', 'lauren', '49.16', 'bronson', '49.67', 'ridgeon', '49.83', 'kipkosgei', '7:46.91', 'lambruschini', '7:47.78', '7:48.38', 'masters', 'rain-affected', 'collingtree', 'gavin', 'levenson', 'coceres', 'gilford', 'cage', 'emanuele', 'canonica', 'howell', 'hedblom', 'bottomley', 'sellberg', 'joakim', 'haeggman', 'klas', 'fulke', 'gates', 'haglund', 'niclas', 'fasth', 'chistian', 'mcfarlane', 'harwood', 'brenden', 'pappas', 'teravainen', 'velde', 'oyvind', 'rojahn', 'mcallister', 'neal', 'briggs', 'retained', 'one-kilometre', '2.777', 'averaged', '57.345', 'lausgberg', 'eighteen', 'hundredths', 'eijden', '1:04.541', 'heeswijk', 'almere', '195-km', 'zabel', 'telekom', 'zanoli', 'mx', 'onda', '.giuseppe', 'citterio', '.robbie', 'kaspars', 'ozers', '8:22:00', 'giuseppe', 'boardman', '4:13.353', '4:14.784', 'gritson', 'moreau', '4:16.274', 'heiko', 'szonn', '4:21.715', 'collinelli', '4:17.551', 'sandstod', '4:24.660', 'alexei', '4:19.762', 'mariano', 'friedick', '4:20.241', 'time-trial', '02.777', 'lausberg', '1:02.795', 'eiden', 'thuet', '1:04.732', 'grzegorz', 'krejner', '1:04.834', 'ainars', 'kiksis', '1:04.896', 'dimitrios', 'georgalis', '1:05.022', '1:05.219', 'keiji', 'kojima', '1:05.300', 'sharman', '1:05.406', 'escuredo', '1:05.731', 'maclean', '1:05.735', 'meidlinger', '1:05.850', 'mckenzie-potter', '1:06.289', 'masanaga', 'shiohara', '1:06.615', 'zyl', '1:07.258', 'keirin', 'nothstein', '10.982', 'neiwand', 'magne', 'buran', 'hubner', 
'gane', 'madison', 'martinelli', 'mcgrory', 'pate', 'kappes', 'carsten', 'betschart', 'risi', 'curuchet', 'immi', 'madsen', 'veggerby', 'galvez-lopez', 'llaneras', 'kotzmann', 'stocher', 'capelle', 'jean-michel', 'monin', 'fulfils', 'prediction', 'ayres', '4,000', '13.353', '4:19.699', '4:17.696', 'amazed', 'proximity', 'indoor', 'perfected', 'obree', 'viral', '4:19.808', '4:21.009', '4:21.454', '4:22.738', '4:24.427', 'gritsoun', '4:26.467', 'l.', '5-67', '105-4', 'chester-le-street', '73-3', 'fowler', 'mcmanaman', 'kishinev', 'scans', 'x-rays', 'chat', 'foolish', 'howey', 'naming', 'gascoigne', 'batty', 'jockey', '21-day', 'irresponsible', 'pontefract', 'leger', 'stayer', 'trigger', 'prominence', 'guineas', 'mister', 'baileys', 'rowing', 'redgrave', 'pinsent', 'coxless', 'thoughts', 'athlete', 'dismisses', 'gatting', 'half-volley', 'square-leg', 'learn', 'stephenson', 'dashed', 'thrid', '1977', 'dismissing', 'chappell', 'hop', '5,200', 'carling', 'guscott', 'rory', 'underwood', 'quartet', 'possess', '244', 'qualities', 'selectors', 'hideo', 'nomo', 'half-game', '13-10', '7-1/3', 'benito', 'santiago', 'amaro', '5-12', 'denny', 'neagle', 'smoltz', '20-7', '14-6', 'devon', 'hutton', 'petkovsek', 'valentine', 'blair', 'gwynn', 'joyner', '34-20', 'eusebio', 'sacrifice', 'comeback', '5-0', 'benched', 'arias', 'smiley', 'one-run', 'armando', 'reynoso', 'bulge', 'larkin', 'one-out', 'mehrtens', 'series-clinching', 'trinations', 'tearing', 'cartilage', 'larsen', 'standby', 'jonah', 'lomu', 'cullen', 'walter', 'josh', 'kronfeld', 'robin', 'olo', 'dowd', 'kwazulu-natal', 'englishman', 'featherstone', 'herschelle', '14-man', 'quadrangular', 'woolmer', 'matured', 'mcc', 'kallis', 'spin-bowling', 'all-rounders', 'nicky', 'boje', 'crookes', 'hansie', 'cronje', 'vice-captain', 'mcmillan', 'kirsten', 'hudson', 'symcox', 'jonty', 'rhodes', 'allan', 'fanie', 'villiers', 'daryll', 'cullinan', 'gibs', '71-57', '40-34', 'alba', 'yuri', 'nikiforov', 'vladislav', 'rodimov', 'donizetti', 
'attendence', 'rodney', 'eyles', 'zarak', 'jahan', 'nicol', 'wellings', 'ryan', 'parke', '2-15', 'julien', 'bonetat', 'jonathon', 'barada', '15-13', 'shabana', 'zubair', 'faheem', 'r', '85-82', '36-46', 'best-of-seven', 'kfar', 'sava', 'zafririm', 'holon', 'maccabi', 'haifa', 'petah', 'tikva', 'lezion', 'beit', \"she'an\", 'beersheva', 'herzliya', 'co-world', 'wednesay', 'four-and-a-half', 'clown', 'no-nonsense', 'attitude', 'routing', '99.9', '22-year-old', 'abnout', 'distracting', 'confining', 'tirades', 'peripheral', 'lounge', 'rant', 'entertain', 'businesslike', 'zero', '77-minute', 'slotted', 'odds', '151-to-1', 'preparation', 'destined', 'nainkin', '2-7', '6-8', '.565', '.511', '.356', '.522', '.451', '.568', '.623', '.427', '.549', '.431', 'rewritten', '29th-ranked', 'superstar', 'graf-like', 'efficiency', 'fourth-seeded', 'second-day', 'crushing', 'medalist', 'fifth-seed', '53rd-ranked', 'maggie', 'loser', 'grab', 'semblance', 'ponytail', 'unleashed', 'tie-break', 'feisty', 'tie-breaker', 'point-by-point', 'valuable', '8-1', 'playoff', 'novelty', 'roof', '51,000', '20-metre', 'dull', 'eijkelkamp', '56th', 'jongsma', 'shock', 'henke', 'fifth-placed', 'weathered', 'non-stop', 'whisker', 'away-goal', 'squandered', 'midway', 'fullback', 'albert', 'ferrer', 'julen', 'lopetegui', 'milinko', 'hristo', 'stoichkov', 'barjuan', 'set-piece', 'free-kick', 'athletic', 'calderon', 'bernabeu', 'distinct', '11,000', 'gabrich', 'iwan', 'kluivert', 'tijjani', 'babangida', 'dani', 'parma', 'roma', 'udinese', 'humble', 'empoli', 'wealthy', 'ancelotti', 'enrico', 'chiesa', 'pescara', 'ottavio', 'palladini', 'giampaolo', 'melli', 'palermo', 'bianchi', 'arrigo', 'sacchi', 'cesena', 'cremonese', 'uruguayan', 'nightmare', 'replay', 'cosenza', 'fidelis', 'andria', 'piacenza', 'atalanta', 'lecce', 'genoa', 'sampdoria', 'nocerina', 'newcomers', 'perugia', 'powered', 'sergio', 'zickler', 'acrobatic', '13-times', 'ruggiero', 'rizzitelli', 'feldhoff', 'rhineside', 'spal', 'reggiana', 
'lucchese', 'vicenza', 'bologna', 'torino', 'avellino', 'lazio', 'bari', 'monza', 'napoli', 'chievo', 'ravenna', '27,600', '48,000', 'akpoborie', '27,000', 'von', 'heesen', 'hirsch', 'pires', 'marc-vivien', 'foe', 'patrice', 'loko', 'psg', 'guivarch', 'last-gasp', 'aime', 'jacquet', 'parc', 'princes', 'raid', 'hard-won', 'spurred', 'leveller', 'crossbar', 'bounced', 'kader', 'ferhaoui', 'blunder', 'jean-claude', 'nadon', 'vairelles', 'lefevre', 'convincing', 'benoit', 'cauet', 'one-two', 'parisians', 'concede', 'leonardo', 'panama', 'dely', 'valdes', 'shocked', 'canaries', 'hintum', 'waalijk', 'schreuder', '6,150', 'vierklau', 'nooijer', '5,696', 'vurens', 'schultz', '22,434', '56rd', '48,123', '71st', 'etienne', 'mendy', '12,000', 'giuly', 'chaouch', 'rouxel', 'baret', 'colleter', 'sg', 'owens', 'tribute', 'relay', 'jesse', 'promoter', 'rudi', 'thiel', 'hopeful', 'holder', 'namibian', '4x100', 'widow', 'squads', 'jayasuriya', 'dashing', 'sanath', 'nine-wicket', 'comfortably', 'modest', '226-5', 'devastating', 'romesh', 'kaluwitharana', 'man-of-the-match', 'aravinda', 'silva', 'ex-captain', 'chipped', 'stumped', '230-1', 'jadeja', 'ganguly', 'dharmasena', 'kambli', 'dravid', 'srinath', 'w-9', '226', '1-4', '2-57', '3-186', '4-217', '5-217', 'kumble', 'mongia', 'kapoor', 'vass', '9-2-35-0', 'pushpakumara', '6-0-23-0', '10-0-59-1', '10-0-42-0', '10-1-39-1', '5-0-24-0', 'a.de', '1-129', 'asanka', 'gurusinha', 'hashan', 'tillekeratne', 'roshan', 'mahanama', 'kumara', 'chaminda', 'vaas', 'muthiah', 'ravindra', '10-1-40-0', '6-0-47-0', '8-0-33-0', '6-0-29-1', '10-2-51-0', '2.2-0-13-0', '2-0-14-0', 'anil', 'ajay', 'sourav', 'vinod', 'rahul', 'nayan', 'javagal', 'venkatesh', 'ashish', 'princeton', 'lyman', 'bailundo', 'savimbi', 'participated', 'joint-commission', 'quartering', 'reality', 'summon', 'subpoena', 'heal', 'confronting', 'basie', 'smit', 'merwe', 'co-operation', 'compiling', 'harrowing', 'frankness', 'subpoenaed', 'human-rights', 'airplane', 'airliner', '1503', 
'1203', 'fire-engines', 'cypriot', 'hijacker', 'arch', '1,100', 'bbl', 'exploratory', 'morinville', 'excess', 'trax', 'et', '10-23', 'logged', 'leduc', 'reef', '5,350', 'cometra', '11-13', '590', '64ths-inch', 'choke', '2-25', 'encountered', 'nordegg', 'apache', 'saunders', '14-28', 'depth', '3,800', 'acreage', 'earning', '5,120', '8,320', 'butte', 'garrington', '4-8', 'barrel', 'brumm', '212-859-1710', 'biogen', 'berlex', 'leslie', 'gevirtz', 'counsels', 'schering', 'tempest', 'tube', 'violated', 'orphan', 'avonex', 'ms', 'betaseron', 'types', 'interferon', 'biovest', 'hedaya', 'marketplace', 'chiron', 'inventory', 'fda', 'ophran', 'exclusivity', 'diseases', 'differs', 'beta-1b', 'counsel', 'astrue', 'chabora', 'newark', 'depositions', 'bissell', 'preside', 'balances', 'acct', '5.208', '4.425', '14.828', '15.687', '20.036', '20.112', '5,124.053', '5,122.084', 'shrugged-off', 'codelco', 'salvador', '0.35', '90.20', '90.50', '89.40', '91.05', '90.85', 'lots', 'huw', '212-859-1646', 'cbsa', 'brass', 'servicenter', 'coil', 'size-per-order', 'harleysville', 'qrtly', '0.21', 'enap', 'oriente', 'escravos', 'empresa', 'nacional', 'petroleo', 'ecuadorian', '960,000', '15-18', 'vague', 'supplied', 'seller', 'petroecuador', '50-cent', '1620', '1241', 'iii', '1249-1286', '1260', 'ghibellines', 'retook', 'florentine', 'guelfs', 'monte', 'aperto', '1768', 'francois-rene', 'vicomte', 'chateaubriand', 'romantic', 'seminal', 'memoires', \"d'outre\", 'tombe', '1781', 'settlers', 'pueblo', 'nuestra', 'senora', 'reina', '1824', 'bruckner', 'composer', 'organist', 'symphonies', 'scale', 'masses', '1870', 'napoleon', 'franco-prussian', '1886', 'skeleton', 'canyon', 'arizona', 'geronimo', 'rebellion', 'surrendered', '1892', 'prolific', 'modernist', 'darius', 'milhaud', 'jazz', 'ballet', 'du', 'madame', 'bovary', '1906', 'german-born', 'biologist', 'delbruck', 'physiology', 'genetic', 'infect', '1907', 'edvard', 'grieg', 'peer', 'gynt', 'suite', 'piano', 'concerto', '1908', 'dmytryk', 
'crossfire', 'hollywood', 'lovely', 'scout', '1944', 'liberated', 'wilhelmina', '1890', 'abdicated', 'juliana', '1963', 'schuman', '1947-48', '1948-52', '1964', 'forth', 'measuring', '6156', 'ft', '3300', 'majesty', '1965', 'schweitzer', 'theologian', 'philosopher', '1913', 'acclaimed', 'interpretations', 'j.s.', 'bach', 'brotherhood', '1952', 'spitz', 'olympiad', 'e.f.', 'fritz', 'guru', 'author', 'simenon', 'character', 'inspector', 'maigret', 'todor', 'zhivkov', 'embezzling', '15-month', '3,000th', 'equality', 'noise', 'bigger', 'detecting', 'fining', 'violators', 'complying', 'trimmed', 'decibels', 'loudness', 'nevertheless', 'worthwile', 'goschen', 'quieter', 'consultation', 'applied', 'busiest', '1959', 'repositioned', 'detect', '7717', 'beats', 'team-mates', 'redraw', 'union-england', 'exclusive', '135.8', 'kiernan', 'one-dayers', 'christchurch', 'dunedin', 'heels', 'caf', 'inability', 'bangui', 'internationally-sponsored', 'sierra', 'leone', 'examining', 'dossier', 'burundi-central', 'disqualify', 'fast-tracks', 'asylum-seekers', 'fast-tracking', 'dissidents', 'fast-tracked', 'processing', 'referred', 'garrett', 'lambert', 'disposition', 'suppose', 'guess', 'preferential', 'patten', 'post-1997', 'ivorian', 'abidjan', 'lapke', 'populaire', 'questioning', 'confidential', 'voie', 'insulting', 'henri', 'konan', 'bedie', 'asec', 'excessive', 'pardoned', 'incitement', 'disturb', 'freetown', 'leonean', 'foindu', 'fallah', 'sewa', 'overran', 'mano', 'junction', 'tongo', 'ascribed', 'uncontrolled', 'bands', 'ivory', 'ruf', 'chiluba', 'shuffles', 'vacancy', 'zambian', 'shuffled', 'sacking', 'remmy', 'mushota', 'tribunal', 'coffers', 'luminzu', 'shimaponda', 'machungwa', 'fictitious', 'rid', 'payroll', 'sidia', 'ousmane', 'kaba', 'root', 'guinean', 'bribes', 'expenditure', 'whereas', 'hydroelectric', '=1,000', 'uniting', 'squabbling', 'liberian', 'inauguration', 'vice-chairmen', 'alhadji', 'kromah', '150,000', 'orgy', 'looting', 'compliance', 'slaves', '1847', 'crp', 
'istafanus', 'elisha', 'shamay', 'o.k.', 'likkason', 'egurugbe', 'ongoing', 'asuu', 'academic', 'universities', 'tafawa', 'balewa', 'four-month', 'detention', 'colonies', 'pleas', 'clemency', 'versions', 'gypsy', 'topolcany', 'elaborating', 'visits', 'sketch', 'murderer', 'identical', 'portrait', 'father-of-three', 'belgians', 'knifeman', 'knifed', 'agnieszka', 'kotlarska', 'u.s.-based', 'modelling', 'versace', 'vogue', 'wyborcza', 'twa', 'booking', 'attacker', 'jerzy', 'intending', 'slip', '1.64', '180.38', '4.38', 'mokhoff', 'alliance-menatep', 'inactivity', 'babayan', 'centrinvest', 'ues', 'unified', 'chips', 'anybody', 'adrs', '0.0817', '0.0822', '8.90', 'gazprom', '0.300', '0.355', '0.445', 'converted', 'investing', 'tightened', 'restricting', 'shareholers', 'mosenergo', '0.958', '0.966', 'rostelekom', '2.56', '2.58', 'lukoil', '9.82', '9.85', 'tolkacheva', 'deportations', 'deporting', 'tritan', 'shehu', 'koha', 'jone', 'deported', 'legalise', '350,000', 'long-standing', 'stumbling', 'bulgarians', 'pre-communist', 'restitution', '96.6', 'abolished', 'soviet-style', '++359-2', '981', '8569', 'vacation', 'staying', 'loudest', 'confusing', 'shiels', 'nagyatad', 'lajos', 'semi-literate', '385', 'bosnian-croat', 'republika', 'srbska', 'override', 'reassert', 'adem', 'hodzic', 'seals', 'bosnia-hercegovina', 'councils', 'invalidated', 'cancellation', 'husein', 'micijevic', 'translators', 'booth', 'seventy', 'mandolina', 'zelic', 'translator', 'ringed', 'szabo', 'studying', 'envelopes', 'inconclusive', 'baltic', '101-strong', 'rebuff', 'toomas', 'savi', 'rosati', 'best-selling', 'marginalised', 'tactical', 'manoeuvre', 'circle', 'unwilling', 'matters', 'chosed', 'harm', 'eastward', 'inevitable', 'resembled', 'soviet-era', 'soars', '1,242.9', '596.5', 'january-may', 'expenditures', '9.50', '7.56', 'end-may', '31.6', '8.26', 'revise', 'pension', 'indexations', '566', '6.0-percent', 'indexation', 'quickened', 'envisaged', '16.98', '20.17', '3.19', 'leu', '3,161', '40-1', 
'3120264', 'nicaraguans', 'delinquency', 'bernardo', 'arce', 'advised', \"gov't\", 'dodging', 'ernesto', 'samper', 'seem', 'prosecutor-general', 'adolfo', 'salamanca', 'senators', 'myles', 'frechette', 'applauded', 'outcast', 'counternarcotics', 'year-old', 'stemming', 'enthusiastic', 'endorsing', 'lords', 'u.s.-bound', 'penalities', 'prisons', 'contributions', 'quake', 'shakes', 'earthquake', 'richter', '11.16', '1716', 'quepos', 'volcanic', 'seismologicial', 'welcoming', 'santamaria', '1700', 'barrier', 'cvrd', 'shelve', 'doce', 'dutra', 'annulled', 'dedicate', 'schomberg', '55-61-2230358', 'yates', '1996-08-29', '5.79', '6.08', '3.98', '148.29', '133.82', '2.07', '8.63', '7.23', 'franked', 'nov', 'reg', '3.67', '2.78', '2.69', 'depreciation', '3.25', '2.79', 'bartender', '9.68', 'bag', 'hometown', 'commuted', 'halting', 'mechanism', 'uncompromising', 'resolutions', 'necessarily', 'binding', 'blasted', 'amounted', 'concerning', 'korei', 'confront', 'confiscation', 'agrees', '8:00', 'puk-kdp', 'endorse', 'massing', 'centres', 'penetrated', 'reflects', 'aggression', 'safeguarded', 'comfort', 'noble', 'contemplate', 'ina', 'morals', 'abdulsamad', 'hameed', 'contrary', 'blasts', 'ignoring', 'crosson', 'ventura', 'mention', 'outdoor', 'commented', 'laughed', 'anti-drug', 'aggressively', 'flashpoint', 'likened', 'stream', 'missiles', 'needle', 'cigarette', 'poison', 'cocaine', 'marijuana', 'remarks', 'cigarettes', 'well-wishers', 'specifically', 'proposition', '215', 'cultivation', 'medicinal', 'headache', 'ingrown', 'toenail', 'non-political', '20-minute', '12-17', 'year-olds', 'flanked', 'bush', 'balance-water', 'dist', 'cty', 'ks', '45,020,000', '22,040,000', '1996a', '22,980,000', 'rfdg', '1996b', '09/05/1996', '06/01', '12/01', '-------------------------------------------------------------', '665m', '840m', '570m', '605m', '70m', '895m', '600m', '2003', '705m', '795m', '2004', '655m', '90m', '965m', '65m', '2010', '60m', '100m', '2011', '30m', '2012', '20m', 
'35m', '11,450', 'weigh', 'underpinned', 'persisted', 'declining', 'firming', 'cash-related', 'random', 'spruce', 'tbf', '0.70', '413.20', '369.00', 'jerry', 'bieszk', '312-408-8725', 'wheat--rains', 'planting', 'above-normal', 'plains', 'near-ideal', 'extension', 'irony', 'old-timers', 'dust', 'bowl', '1930s', 'turnabout', 'hodges', 'climatological', '20.19', 'climatologist', 'mosier', 'panhandle', 'beneficial', 'ideal', 'mositure', 'dolly', 'topsoil', 'adequate', '816', '561-8671', 'settles', 'jacksonville', '19.4', 'portfolios', 'thrifts', 'discontinued', 'installment', 'amoco', 'yemen', 'sharing', 'shabwa', 'dietsch', 'mees', 'production-sharing', 's-1', 'exploring', 'deferring', 'yemeni', 'amoco-yemen', 'contractor', 'potentially', 'oilfields', 'encyclopedia', 'ludwig', '1633', 'defends', 'hostile', 'evelyn', 'leopold', 'lashed', 'windfall', 'army-run', 'lengthy', 'nsanze', 'terence', 'tanzanian', 'julius', 'nyrere', 'unsympathetic', 'buyoya', 'tutsi-run', 'bind', 'gratuitous', 'immolation', 'mothusi', 'nkgowe', 'coups', 'dump', 'heap', 'justification', 'legitimate', 'discussion', 'impose', 'suggests', 'impede', 'chilean', 'cautious', 'defend', 'exposed', 'terroritsts', 'somavia', 'unarmed', 'inaction', 'indiscriminate', 'inderfurth', 'unconditional', 'berne', 'cantons', 'eoe', '1605', '83,008', '60,131', '22,877', '7,391', '5,658', '15.72', 'ahold', '7,190', '1,123', '10.01', 'bolswessanen', '4,420', '705', '6.17', 'abn', 'amro', '3,003', '1,940', '5.95', '3,853', '673', '5.45', '3,060', '843', '4.70', '020-504-5040', 'sucks', 'seven-year-old', 'cheques', 'ventilation', 'pipe', 'canard', 'enchaine', 'sucked', 'confederate', '113.00', 'eksportfinans', 'suedwest', '3.60', '1.75', 'economists', 'suisse', 'flat', '0.6', 'conf', '113.02', 'comi', 'medium-term', '109.45', '97.82', '4-1/2', '2006', '101.80', '4.252', '+41', '631', '7340', 'anti-bhutto', 'marched', 'removal', 'benazir', 'bhutto', 'zardari', 'nawaz', 'sharif', 'muslim', '16-party', 'nepotism', 
'colourful', 'chanting', 'anti-government', 'balochistan', 'quetta', 'extra-judicial', 'youths', 'mohajir', 'mqm', 'turn-out', 'mobilised', 'turbulent', 'calmer', 'speaks', 'urdu-speaking', 'migrated', 'descendants', 'disaster', 'dislodge', 'holy', 'acc', 'apr-jul', 'april-july', '2.93', 'nani', 'palkhivala', '3.14', 'april-march', '3.01', 'grinding', '275,000', '1994/95', '77.79', '87.45', 'inadequate', 'infrastructural', 'shortages', 'achieved', '9.4', 'retaining', 'wsrl', 'kredietbank', 'welspun', 'stahl', 'rohren', 'part-finance', 'submerged', 'welded', 'pipes', 'maturing', 'indusind', 'uti', 'gujarat', '175,000', 'annum', 'longitudinal', 'spiral', 'yarn', 'towels', 'polyester', 'fishermen', 'p.v.', 'krishnamoorthy', 'rameswaram', 'mid-sea', 'accosts', 'arulanandam', '850', 'nadu', 'tamil-speaking', 'karunanidhi', 'influx', 'officals', 'impounded', 'trawlers', 'licenses', 'bose', 'assurance', 'revoke', 'coerced', 'palk', 'pesalai', 'fish', 'chinnathambi', 'unfair', 'penalise', 'fisheries', 'enforce', 'pomfret-rich', 'offerings', 'bales', 'vw', 'carmaker', 'adelt', 'passat', 'sedan', 'gilardi', 'miltiadis', 'evert', 'alexandroupolis', 'nd', 'businessmen', 'depart', 'unleashing', 'seven-point', 'merchants', 'professionals', 'pensions', '600', 'drachmas', 'absorption', 'evasion', 'accelerate', 'component', 'pushes', 'griffiths', 'chip', '3921.8', 'rebounded', 'jeopardise', 'tie-up', 'link-up', 'better-than-expected', 'non-eu', '506', '788', '1.12', '1.4', 'nonetheless', 'buoyed', '2,563.16', '4.32', 'viannet', 'communist-led', 'cgt', 'firmer', '108.40', 'gauge', 'rock-bottom', 'boj', 'predictions', 'improving', 'backbone', 'spectacular', 'breakout', 'baader', 'slippage', 'faltering', '1.4765', '107.78', '1.4779', '3,920.7', '15.09', '2,002.9', '388.50', '521.15', '1=.6421', 'aei', 'iso', '9002', 'twenty-second', 'accreditation', 'veritas', 'accredited', 'iberfreight', 'alicante', 'bilbao', 'seville', 'valencia', 'wafa', 'stupidity', 'strongest', 'expand', 
'kiryat', 'sefer', 'demolishing', 'idiots', 'stupid', 'withdrawing', 'hurting', 'bethlehem', 'cater', 'labourers', 'al-aqsa', 'christians', 'bombings', 'halves', 'abandoning', 'diplomacy', 'bells', 'mahmoud', 'abbas', 'mazen', 'dore', 'promises', 'pressing', 'long-delayed', 'hebron', 'redeployment', 'yitzhak', 'mordechai', 'omer', 'akbel', 'prodi', 'tunceli', 'fsa', 'qualifies', 'muni', '2.44', 'ansgar', '3.334', 'obligation', 'avalon', 'borough', 'gos', 'seaford', 'n.y.', '6.31', 'colo', 'taxable', 'aa2', 'fac', 'auth', 'assoc', '4,300,000', 'lamm', 'ticket-cnn', 'cnn', 'competed', 'three-term', 'vied', 'disillusioned', 'horizons', 'donaldson', 'lufkin', 'jenrette', '35-7/8', 'payout', '0.69', '408-8787', 'mull', 'vowinkel', 'appeals', 'reorganisation', 'chiate', 'reinsure', 'liabilities', 'equitas', '1100', 'rowland', 'litigation', 'chairmen', 'gale', 'norton', 'immunizes', 'seeks', 'rescision', 'alternate', 'remedy', 'individually', 'rejection', 'forfeiting', 'risking', 'rejecting', 'gestures', 'bavarian', 'detail', 'nuremberg-based', 'duty', 'prosecutors', 'adolf', 'infamous', 'prosecute', 'gun-wielding', 'pistol', 'overtook', 'photographed', 'potsdam', 'nerve', 'coercion', 'file', 'degrading', 'lets', 'commit', 'clerk', 'u', 'indecency', 'performing', 'sadistic', 'torture', 'oral', 'fanfare', 'alerted', 'packages', 'sep', 'archaeological', 'reppas', 'theodoros', 'pangalos', 'coincide', 'celebrations', 'components', '756', '829', '876', '933', '1.07', '0.98', '657', '1.00', '1.09', '2.37', '2.01', 'refer', 'cavorting', 'ducruet', 'bodyguard', 'naked', 'poolside', 'tremila', 'gente', 'undressing', 'embracing', 'sunbed', 'explicit', 'fili', 'houteman', 'dancer', 'cabaret', 'principality', 'rainier', 'disapproved', 'caroline', 'villefranche', 'cameras', 'sound-track', 'almeida', 'saxony', 'ip', '804', 'acucar', 'auchan', '805', 'camat', 'agf-iart', '806', 'clears', 'billa', 'rewe-handelsgruppe', 'anita', 'gradin', 'exploitation', 'stockholm', 'eurostat', '51/96', 
'march-may', 'tomato', 'warriors', 'bunol', 'pelted', 'armfuls', 'ripe', 'tomatoes', 'coated', 'blood-red', 'firework', 'fruit-throwing', 'frenzy', 'hurl', 'occasion', 'historians', '1945', 'disgruntled', 'locals', 'spontaneously', 'bombard', 'fiesta', 'boo-nee-ol', 'fame', 'grown', 'imerisia', 'pre-election', 'heats', 'includind', 'pasok', 'scrambles', 'slaps', 'coupons', '12.70', 'upcoming', 'kathimerini', 'inflows', 'post-election', 'subway', 'snags', 'overshoot', '520', 'lighten', 'kerdos', 'vows', 'mesures', 'kicks', 'yannos', 'papandoniou', 'drachma', 'constantine', 'mitsotakis', 'shake', 'naftemboriki', 'annually', 'georgiopoulos', 'hoek', 'loos', '28.9', '24.5', '273.6', '290.3', '44.4', '40.7', 'gases', '13.26', 'stagecoach', 'swebus', 'principle', 'stg-plus', 'vendors', 'see-saw', '0515', 'ninety-day', '9.93', '90.18', 'samurai', 'eurokiwi', 'issuance', 'certainty', '4746', 'guinness', 'peat', 'gpg', 'profitability', 'inevitably', 'weiss', '9.77', '6.93', 'pleasing', 'stemmed', 'consolidate', 'tyndall', 'mid-east', 'newcrest', 'abnormals', '20.81', '42.4', 'telfer', 'boddington', 'grades', 'evades', 'dense', 'bushland', 'occured', '6.30', '2030', 'glenwood', 'maryborough', 'emergent', 'quarantine', 'sightings', '.22', 'self-loading', 'probability', 'bushman', 'fixed-wing', 'cordon', 'sq', 'littered', 'caves', 'hideout', 'enabled', 'evade', 'heated', 'tasmania', 'rampage', 'penal', 'ek', 'chor', 'motorcyle', 'shanghai-ek', 'sino-thai', 'engines', 'pudong', 'automobile', '1.56', 'xingfu', 'motorcycles', 'khmer', 'rouge', 'ieng', 'sary', 'pot', 'aranyaprathet', 'dissident', 'hardliners', 'dnum', 'cambodian', 'ta', 'mok', 'dictatorial', 'copy', 'absentia', 'cambodia', '1975-1979', 'overwork', 'french-educated', 'brother-in-law', 'phnom', 'penh', 'russian-made', 'mi-17', 'mouly', 'resupply', 'stung', 'treng', 'mof', 'kubo', 'geared', 'worsening', 'supplementary', 'contraction', 'smoothly', 'mid-september', 'april-june', 'acknowledge', 'wartime', 'tide', 
'resurgent', 'militarism', 'atrocities', 'unrepentant', 'militarists', 'undecided', 'indignant', 'shrine', 'dedicated', 'whitewash', '1931', 'genuinely', 'apologised', 'remorse', 'sakigake', 'masayoshi', 'takemura', 'smallest', 'ldp', 'destabilise', 'splits', 'reform-oriented', 'yukio', 'hatoyama', '49-year-old', 'snubbed', '62-year-old', 'pointedly', 'allies', 'resolve', 'backers', 'tainted', 'ldp-dominated', 'unpopular', 'taxpayer', 'ruined', 'stalled', 'defectors', 'bolts', 'lawmakers', 'eight-month-old', 'dissolve', 'reconvenes', 'hing', '2.7', '65.61', '63.87', '249.53', '242.94', '119.49', '134.40', '23-27', 'engages', 'warehousing', 'hurled', 'consulate-general', 'stromme', '430', 'molotov', 'cocktail', 'parking', 'novelist', 'dai', 'houying', '1966-76', 'revolution', 'intellectuals', '1937', 'anhui', 'teacher', 'hawaii', 'ren', 'translated', 'hwa', 'kay', 'plunges', '30.26', '0.53', 'unloaded', '47.5', '3,684', '7,011', '3,292', '1,683', '5,539', '115,941', '38.4', '83,801', '813', 'editorials', 'straights', 'beijing-funded', 'wen', 'wei', 'stem', 'ming', 'newly-established', 'lead-up', 'judiciary', 'subjected', 'survival', 'indecisive', 'hesitancy', '6441', 'frees', 'dahman', 'gaza-based', 'addameer', 'attorney-general', 'khaled', 'al-qidra', 'qidra', 'false', 'nahed', 'dahlan', 'headlines', 'pais', 'juvenile', 'aleix', 'vidal-quadras', 'catalan', 'defenestration', 'cinco', 'dias', 'santander', 'conquest', 'gaceta', 'negocios', 'caja', 'banisadr', 'abolhassan', 'commandeered', 'round-the-clock', 'fearing', 'gangland-style', 'machinegun', 'heed', 'sworn', 'enemy', 'chiefs', 'iberia', 'installations', 'consists', 'joulwan', 'sheehan', 'copenhagen', 'cleaning', 'aaxis', '10.9', 'logo', 'falsified', 'accounts', 'provisions', '146', 'necessitate', '+45', '33969650', 'balks', 'balked', 'stringent', 'surpasses', 'sewers', 'interfering', 'augment', 'threaten', 'dha', 'coordinate', '1.13', 'monies', 'reparations', 'deducted', 'overseeing', 'anticipated', 
'supervision', '1,190', '267', '923', '598', 'york-based', 'overseers', 'percentile', 'emissions', 'caep', 'consultancy', '251/09', 'overland', 'delegations', 'nis', 'tra', '003', 'iae-3', '251/08', 'microfiche', 'di', '96/04', 'micromation', '251/07', 'gaseous', '251/06', 'tacis', '251/05', 'eec', '4064/89', '251/04', '251/03', 'wines', '251/02', 'ecu', '251/01', 'cull', 'obviously', 'examine', 'kiely', 'methodology', 'slaughtered', 'eradication', 'disappoint', 'predicted', '340', 'infections', 'naish', '147,000', 'reluctantly', 'placate', 're-examined', 'considerably', 'culled', 'reopen', 'slapped', 'creutzfeldt-jakob', 'cjd', 'bse-infected', 'blockades', 'roadblocks', 'importing', 'radios', 'blockaded', 'motorways', '0100', 'discovery', 'chopra', \"o'malley\", 'walton', 'iain', 'romero', 'jimenez', '147', 'antoine', 'lebouc', 'curry', 'affleck', 'sorensen', '19.6', 'ekimov', 'giunluca', 'gorini', 'breukink', 'wilfried', 'peeters', 'bart', 'voskamp', 'randolph', '11.20:33', 'lietti', 'mg-technogym', 'maarten', 'bakker', 'olaf', 'fifth-stage', 'zevenaar', 'venray', 'one-dayer', 'overs-a-side', '225-5', '46.4', '4:15.006', '4:23.029', '4:16.141', '4:19.665', '4:11.114', '4:20.341', 'darryn', '44.804', 'fiedler', '45.455', 'florian', 'rousseau', '45.810', 'georgios', 'chimonetos', 'lampros', 'vasilopoulos', '46.538', 'magali', 'faure', 'kathrin', 'freitag', '11.833', '12.033', 'felicia', 'ballanger', 'grichina', '11.776', '12.442', 'tanya', 'dubnicoff', '12.211', '12.208', 'annett', 'neumann', 'enioukhina', '12.434', '12.177).', 'restricts', '225', 'englishmen', '10-1-36-2', 'skying', 'long-on', 'off-side', 'well-flighted', 'pavilion', 'inswinging', 'b-2', 'w-7', '1-82', '2-141', '3-160', '4-174', '5-203', 'saqlain', '10-0-44-1', '10-3-31-1', '10-0-52-0', '10-0-56-1', 'nb-4', '1-57', '2-98', '3-146', '4-200', '5-220', '9.4-1-45-3', '7-0-28-1', '10-1-54-0', '3-0-14-0', '7-1-29-1', 'edgbaston', 'lombardi', 'polti', 'hans', 'clerq', 'jemison', 'servais', 'knaven', 
'10.57:33', 'fourth-stage', 'doetinchem-doetinchem', 'tunbridge', '40-3', '4-66', '4-45', '82-0', 'hove', '285-6', 'athey', '79-2', '259', 'saggers', '6-65', '8-0', '114', 'watkin', '4-28', 'solanki', '4-31', '166-1', 'barnett', '226-1', 'pooley', 'ramprakash', '5-55', 'fay', '4-77', '202-5', '183', '123-4', '1996-08-30', 'mcgeechan', 'grobbelaar', 'england-based', 'bruce', 'zifa', 'vice-chairman', 'pamire', 'five-nation', 'duvillard', 'argyle', 'segers', 'fashanu', 'heng', 'suan', 'lim', 'pleaded', 'accepting', '69-60', '35-23', '97-94', '39-32', 'jenson', '9-15', '.468', '.436', '.413', 'krizan', 'lila', 'osterloh', 'nanne', 'dahlman', '8-', '.561', '.353', '.602', '.478', '.564', '.459', '.626', '.444', '.403', '.424', '.552', 'slide', 'yankee', 'mulholland', 'bench-clearing', 'kingdome', 'ejected', 'marzano', 'brushed', 'wengert', 'nine-hitter', 'herrera', 'minors', 'baldwin', 'ozzie', 'guillen', '10-4', 'nilsson', 'offerman', 'rick', 'huisman', 'hentgen', '17-7', 'tossing', 'orel', 'hershiser', 'belle', 'yorkers', 'new-found', 'aggressiveness', 'adjusting', 'louder', 'messed', 'adrenalin', 'lanes', 'pitching', 'winningest', 'ron', 'wright', 'double-a', 'greenville', 'pointer', 'class-a', 'mid-season', '11-game', 'minor-league', 'phenom', 'andruw', 'post-season', 'abdellaoui', 'graef', '36th', '10,760', 'honour', 'assembled', 'quartets', '1936', 'anchor', 'autograph', 'ornate', 'dillard', 'lindy', 'remigino', 'hines', 'hasely', 'crawford', 'inspired', 'grand-daughter', 'gina', 'tillman', 'bachini', 'emon', 'bois', 'bronckhorst', 'ferdy', 'romania-hungary', 'much-delayed', 'positively', 'neighbourly', 'consulates', 'thessaloniki', 'observance', 'picks', 'bold', 'ogilvy', 'mather', 'communication', 'linked', 'divorces', 'romantically', 'petition', 'presenter', 'mocked', 'gymnasium', 'liffe', 'apt', 'automated', 'pit', 'tabular', 'gilt', '1/32', '107-12', '107-10', '107-06', '94.26', '97.42', '97.38', '97.34', '96.84', '96.83', '115.62', '115.58', '115.32', 
'eurolira', '91.37', '91.36', '91.33', 'euroswiss', '97.79', '97.80', '3,894.00', '3,941.50', 'installs', 'kinshasa', 'cne', '9,446', 'deployed', 'deadlines', 'yoka', 'lye', 'mudaba', 'progressively', 'maniema', 'shaba', 'bandundu', 'installation', 'mobutu', 'sese', 'seko', 'object', 'insists', 'ikimi', 'fact-finding', 'wanting', 'ministerial', 'continuation', 'saro-wiwa', 'restricted', 'beatrix', '1652', 'guns', 'forbidden', 'categories', \"n'djamena\", 'idriss', 'deby', 'nomads', '125-member', 'fraternite', 'matin', 'establishes', 'decentralisation', 'bauza', 'donwahi', 'douati', 'alphonse', 'illicit', 'swine', 'jour', 'lakpe', 'appoints', 'severin', 'kouame', 'tanny', '+225', 'mahala', 'zvornik', 'lieutenant', 'marriner', 'retaliation', 'angry', 'mob', 'long-barreled', 'ak-47', 'lightning', 'berovo', 'cathedral', 'thunderstorm', 'kornblum', 'milosevic', 'greste', 'slobodan', 'defuse', 'manipulation', 'srpska', 'bolster', 'patron', 'rectify', 'expulsions', 'blessing', 'banja', 'luka', 'biljana', 'plavsic', 'oversee', 'mini-state', 'choosing', 'three-member', 'comprised', '2,901.48', 'rbls', 'rao', 'roubles', '2,891.00', 'ffk', '2,746', '2,840', '2,998', '0.042', '139.75', '0.59', '23.6', 'illiquid', 'harder', '406.6', '0.375', 'artyom', 'danielyan', 'kosovo', 'boycotted', 'institutions', 'bajgora', 'donje', 'ljupce', 'podujevo', 'celopek', 'revoked', 'cracked', 'moderates', 'cradle', 'meningitis', 'emanuil', 'ceausu', 'babes', 'infectious', 'virus', 'lasts', 'gastro-intestinal', 'tract', 'vukasin', 'filipovic', 'supplying', 'staging', 'mismanagement', 'finmin', 'raul', 'matos', 'azocar', '1630', 'imf-hosted', 'seminar', 'metric', 'sail', 'cartagena', 'coffee', 'non-oil', 'non-traditional', '334', '302', 'ocei', 'imf-sponsored', '2.240', '2.693', '951', 'foods', '27.4', '24.6', 'jpr', 'cops', 'racket', 'thirteen', 'lago', 'nacion', 'credibility', 'undermined', 'scandals', 'indictment', 'piotti', '3,600', 'dishonest', 'purged', 'brave', 'kandir', 
'constitutionally', 'same-day', 'cetes', 'nervousness', '24.25', 'co-ordinated', 'acceptances', 'pagares', '25.10', 'longer-term', 'masked', 'oaxaca', 'assaults', 'credits', '2.209', 'oversupply', '684', 'shortfall', 'inflow', 'lezama', 'newroom', '728', '9554', '05:53', 'chilpancingo', 'pre-electoral', 'bickering', 'acatepec', 'fanned', 'intimidate', 'stirred', 'agir', 'ensemble', 'pour', 'droits', \"l'homme\", 'exerted', 'psychological', 'grabs', 'aguirre', '47-year-old', 'pessina', 'restaurants', 'travelled', 'condemn', 'day-to-day', 'punish', 'landless', 'peasants', 'countryside', 'ecumenical', 'endemic', 'thirty-six', 'massacred', 'para', 'lucas', 'moreira', 'neves', 'bishops', 'flees', 'passport', 'consular', 'anti-corruption', 'soliciting', 'icac', 'anti-graft', 'bribe', '12,940', 'scams', 'honduran', 'passports', 'thinks', 'solve', 'woes', '1,617', 'rajapat', 'warnings', 'pullouts', 'chatichai', 'choonhavan', 'chavalit', 'yongchaiyudh', 'aspiration', 'insincere', 'slowdown', 'switched', 'monarchy', '1932', 'yassin', 'ramle', '60-year-old', 'fundamentalist', 'wrecking', 'confined', 'freeing', 'skhirat', 'purely', 'vital', 'conlon', 'triumphal', '10-week', 'abruptly', '200-an-hour', 'eavesdrop', 'conversations', 'campaigns', 'invaluable', 'captivated', 'worried', 'senator', 'dianne', 'feinstein', 'bump', '50-year-old', 'dogged', 'wrongdoing', 'misconduct', 'questionable', 'judgment', 'selecting', 'advisers', 'revert', 're-elected', 'revelled', 'heartland', 'hoarse', 'voice', 'resolute', 'wit', 'stilted', 'glib', 'piper', 'jaffray', 'tax-exempt', 'compiled', '8/30', '-------------------------', 'a-rated', \"gen'l\", '4.45', '4.40', '+0.05', '4.90', '-----', '5.40', '5.35', '5.55', 'rev', 'muscular', 'dystrophy', 'gene-therapy', 'technique', 'telethon', 'method', 'muscle', 'degenerates', 'adulthood', 'non-working', 'producing', 'dystrophin', 'altered', 'common-cold', 'minimise', 'susceptibility', 'injected', 'mice', 'bred', 'genes', 'experiment', 'fibers', 
'diminishing', 'test-tube', 'immune-system', 'oilseeds', 'oilseed', 'assn', '98,000', 'no.1', 'cargill', 'mitsui', 'dreyfus', '10-30', '16,300', 'dns', '212.00', '205.10', 'ww', '202.65', '19,500', '212.25', '204.74', '199.71', '23,500', '9,600', '4,900', '199.56', '18,278', '195.79', 'donation', 'taichung', 'procurement', '108,000', 'soybeans', 'bunge', '11-25', 'pnw', '0.8584', '6-20', '.8787', '31,412', 'pl-480', '303.19', 'buyer', '15-30', '595,400', '319,600', '12,300', '300,800', 'upland', '50,400', '54,800', '100,600', '75,000', '1,700', 'sorghum', '6,200', '156,700', 'pima', '49,900', 'poultry', 'fruits', 'gaining', '25.0', 'quota', 'onic', 'panel', 'cutout', 'offal', 'moines', 'steer', '9.76', '0.03', 'help-wanted', 'uneven', '83.0', '85.0', 'goldstein', 'want-ad', 'hiring', 'matched', 'heist', '690,000', 'jewelry', 'showboat', 'capt', 'andrews', 'videotape', 'suitcase', 'resembling', 'wholesaler', 'schein', 'suitcases', 'closet', 'jewellers', 'mid-twenties', 'distract', 'mcgilley', 'description', 'o.j.', 'simpson', 'hints', 'financially', 'jury', 'gag', 'prohibits', 'acquittal', 'crying', 'blues', 'erroneous', 'jam-packed', 'distanced', 'buffalo', 'wildly', 'supportive', 'gifts', 'year-long', 'limelight', 'supermarket', 'reprinted', 'editions', 'vitriol', 'journalism', 'dignify', 'surgeon', 'discarding', 's.c.', 'amputated', 'improperly', 'disposed', 'deformed', 'infant', 'prosthesis', 'orthopedic', 'educational', 'freezer', 'spoiled', 'crab', 'trap', 'flesh', 'cop', 'shrub', 'guys', 'bagged', 'checker', 'pines', 'drive-through', 'toting', 'earl', 'feugill', 'camouflaged', 'shaggy', 'freeze', 'marines', 'attaching', 'strips', 'burlap', 'disguise', 'staking', 'robberies', 'fast-food', '90-minute', 'stakeout', 'dla', '2.7975', 'logistics', '2.7775', 'nbc', 'consultant', 'reshaped', 'ms-nbc', 'ire', 'repositioning', 'gluten', 'meal', 'steady-higher', 'pickup', '117.00', 'pellets', '320.00', 'decatur', 'il', 'cedar', 'rapids', 'ia', '310.00', 't', '234,324', 
'cereals', '105.07', 'ecus', 'provisionally', 'optional-origin', 'enjoys', 'subtracting', '34,277', '109.36', '5432', 'shipyard', '3,500', 'cherbourg', '1,800', 'yeard', 'cutback', 'indre', 'managements', 'curtail', 'estates', 'hub', 'gadoon', 'unearthed', 'police-run', 'cages', 'tando', 'allahyar', 'hyderabad', 'recorder', 'sui', 'technologists', 'sugarcane', 'pillaged', 'gujar', '3,225', 'megawatt', 'on-line', 'mohib', 'textile', 'defaulted', 'leasing', 'modarabas', 'multiply.q', '7.84', 'shahid', 'privatisation', 'sindh', 'ad-interim', 'restraining', 'javedan', 'dadabhoy', 'pvt', '9251-274757', 'directions', 'occupying', 'rebelled', 'wrecked', 'heavily-mined', 'halo', 'roadsides', 'qotbuddin', 'hilal', 'officiated', 'sprinkling', 'petrol', 'andhra', 'pradesh', 'rarest', 'beings', 'roasted', 'appellants', 'plotted', 'k.t.', 'elephant', 'tramples', 'rampaging', '72-year-old', 'trampled', 'hari', 'maya', 'poudels', 'madhumalla', 'asleep', 'beast', 'kingdoms', 'elephants', 'overrun', 'kudapokuna', 'welikanda', 'army-controlled', 'vavuniya', 'undercover', 'vicorp', 'sabourin', 'cfo', 'denver', 'bestop', 'boulder', '1610', 'socal', 'edison', 'kilovolt', 'kv', 'wildfire', 'raging', 'conroy', 'crews', 'fire-related', 'residues', 'megawatts', 'mw', '1,200', 'containment', 'arid', 'windy', 'leong', '1622', 'munis', '0.056', 'municipals', 'semiconductor', 'expectation', 'emerge', 'modem', '2-1/8', '11-3/8', 'modem-chip', 'fast-growing', 'networking', 'elias', 'moosa', 'roberston', 'pmc-sierra', 'chipsets', 'severance', 'randall', 'soundview', 'focusing', 'fastest-growing', 'much-larger', 'develops', 'shrink', 'hambrecht', 'quist', 'low-margin', 'pmc', 'slowing', '206-386-4848', 'housecall', 'sink', 'underperform', '7-3/8', '7-1/8', 'atlanta-based', '0.17', 'non-medicare', 'hospice', 'limitation', 'subsidiaries', '17,024,000', '18,174,000', '31,834,000', '24,137,000', '7,718,000', '6,828,000', '14,668,000', '13,091,000', '9,167,000', '11,175,000', '16,909,000', 
'10,880,000', '1.05', '1.59', '1.02', '10,650,407', 'forma', '9,306,000', '11,346,000', '17,166,000', '11,046,000', '3,820,000', '4,658,000', '7,047,000', '4,534,000', '5,486,000', '6,688,000', '10,119,000', '6,512,000', '0.37', '0.68', '0.44', '14,775,000', 'oasis', 'gallagher', 'obscene', 'swore', 'hate', 'f...', 'supermodel', 'noel', 'laryngitis', 'house-hunting', 'patsy', 'kensit', 'tickets', 'slough', 'upbeat', 'pretax', '14p', '1009', '12-1', '2p', '468p', '691p', 'hammerson', '8p', '390', 'warburg', 'stances', 'maintaining', 'rental', 'incomes', 'shaved', 'nigel', 'mobbs', 'birt', 'shrinks', '26.5', 'seasonally', '715', '973', 'canadians', '3.72', 'burea', '613', '235-6745', 'palestinian-ruled', 'shaken', 'backdrop', 'four-hour', '0900', 'espionage', 'rings', 'jomhuri', 'eslami', 'photographing', 'pan-turkism', 'exiles', 'fallahiyan', 'distillates', 'kerosene', '99', 'sort', 'noticeable', '45-50', 'differential', 'ports', 'exceed', '27.40', '27.70', '27.22', 'cargoes', '24.00', '24.20', '24.10', '24.24', 'lowest', 'suspicious', 'overhang', 'sulphur', '70-75', 'manuscript', 'thieves', 'testament', 'al-akhbar', 'undated', 'pretended', 'wyche', 'invoked', 'recess', 'confirming', 'predecessor', 'mabus', 'shops', 'shutters', 'exporters', 'purchasing', '1997/98', '199,900', '149,100-a', '74,600', '55,000-b', '161,600', 'a-', '54,600', 'b-', '55,000', 'destinations', 'southland', 'mainframe', 'delivering', 'real-time', 'constitutes', 'contends', 'misappropriating', 'nba', 'continually', 'baxter', 'immuno', 'miilion', 'secures', '747s', 'cos', 'chipset', 'hotels', 'doubletree', 'five-point', 'toxic', 'stock-trade', 'h&r', 'compuserve', 'impasse', 'authorised', 'trashed', 'nudge', 'gop', 'reporter', 're-nomination', 'state-by-state', 'beachcomber', 'highlands', 'foot-long', 'debris', 'bearing', 'markings', 'conducting', 'fireball', 'wallets', 'shoes', 'mechanical', 'leila', 'corcoran', 'writes', 'still-enslaved', 'pleads', 'abraham', 'maimed', 'poses', 'volunteers', 
'preserved', 'microfilm', 'stowed', 'rarely', 'enlistment', 'discharge', 'certificates', 'unveiling', 'memorial', '37,000', 'shall', 'oportunity', 'enjoyment', 'sic', 'slavery', 'oppreses', 'liberty', 'outpouring', 'coloured', 'curse', 'separated', '1865', 'well-to-do', 'matron', 'plead', 'dishonourable', 'prisoner', 'thoughtless', 'folly', 'notation', 'regiment', 'pardon', 'anguish', 'amputee', 'terrible', 'haunted', 'posed', 'bare-chested', '1864', 'insight', 'rhythms', 'carbondale', 'editor', 'gen', 'ulysses', 'writings', 'poetic', 'linguistic', 'treasure', 'trove', 'sociology', 'seared', 'consciousness', 'confederacy', 'retirees', 'budge', 'weidman', 'shepherded', 'predicts', 'databases', 'battlefields', 'discharged', 'incapacity', 'inebetude', 'arise', 'masturbation', 're-nominate', '559-mile', 'vow', 'sylvie', 'ajaccio', 'mediterranean', 'defused', 'get-tough', 'jean-louis', 'debre', 'corse', 'lax', 'widely-reported', 'powerless', 'france-soir', 'beauvau', 'nightly', 'figaro', 'shaky', 'seven-month', 'racked', 'low-level', 'separatist-inspired', 'principally', 'backlash', 'om', 'gruppen', 'omlx', 'pulpex', 'pulp', 'timber', 'recycled', 'complements', 'softs', 'cocoa', 'unpredictable', 'risky', 'hedge', '+46-8-700', '1006', 'amsterdam-rotterdam-antwerp', 'tankage', 'week-ago', '29/8/96', '22/8/96', '1/9/95', '400-425', '425', 'naphtha', '50-75', '75-100', '1,650', '1,850-1,900', '325-350', 'kero', '15-20', 'throughput', 'straight-run', 'bunkering', 'blenkinsop', 'anti-nuclear', 'pantomime', 're-enacting', 'brandished', 'theatre-prop', 'gorleben', 'depot', 'mafia', 'catania', 'sicily', 'slaying', '14-year-old', 'nephew', 'puglisi', 'salvatore', 'botta', 'cemetery', 'sicilian', 'hardened', 'anti-mafia', 'tip-off', 'consciences', 'nitto', 'santapaola', 'knelt', 'ambush', 'cemetary', 'canteen', 'limerick', 'warders', 'takings', 'italians', 'hiv-pensioner', 'harassing', 'hookers', '61-year-old', 'aids', 'pensioner', 'pietro', 'hiv', 'cruising', 'red-light', 
'hurling', 'blanks', 'sighted', 'arctic', 'spitzbergen', 'rune', 'ntb', 'vnukovo', 'tupolev', 'longyearbyen', 'airstrip', 'rescuers', 'three-engine', 'opera', 'mountainside', '0815', 'coal-mining', 'barentsburg', '1920s', 'galeforce', 'meteorological', 'cellars', 'trees', 'uprooted', 'roofs', 'trains', 'cm', '2.24', '7.4', '2.96', 'communes', 'rmt', 'turnhout', 'scouts', 'camping', 'meadow', 'hindered', 'excavations', 'jumet', 'sex-and-murder', 'lightly', 'tides', 'pesetas', 'chemicals', '4,150', '61.45', '61.94', '4,175', 'madness', 'overreacted', '+34', '585', '2161', 'nahar', 'liberte', 'leveilly', 'finns', 'sex-abuse', 'captive', 'tampere', 'luxury', 'ilkka', 'laasonen', 'iltalehti', 'audi', 'ingolstadt', 'demel', 'hedged', 'kekkila', 'full-yr', 'fertilisers', 'saplings', 'trend', 'fluctuations', 'end-year', 'interview-t&n', 'untroubled', 't&n', 'bumble', 'predict', 'echoing', 'automotive', 'equally', 'predicting', 'rationalised', 'destocked', '9.5', 'destocking', 'relaxed', 'cycle', 'fraction', 'commenting', 'piston', 'kolbenschmidt', 'obstacles', 'huddart', '8716', 'jolts', 'zealands', 'waiau', 'spa', 'hanmer', 'prone', 'earthquakes', 'smooth', 'trevelyan', 'half-yearly', 'absolutely', 'predicated', 'precepts', 'trough', 'draconian', 'rentals', 'reclamation', 'narrowly', 'downtrend', 'hover', 't$', '27.482', '27.495', '275', '2-5080815', '20,500', '20,605', 'touching', 'intraday', '20,530', '20,725', '19,560', 'technically', '20,300', '21,000', 'doreen', 'siow', '65-8703092', 'siam', 'banker', '8.46', '662', '652-0642', \"m'bishi\", '7-year', 'tokyo-mitsubishi', '2.95', 'sep.03', 'sep.96', 'int', 'mar.97', 'sub', 'jul-18.jul', 'jcr', 'jbri', 'daewoo', 'dacom', '822', '727', '5644', 'commem', 'manufactures', 'ski', 'antara', 'evident', 'happening', 'motivated', 'major-general', 'utomo', 'indonesias', 'extinguished', 'injures', 'exaggerate', '11.38', '11.45', '918', '490', '538', 'rents', 'haneda', 'itami', 'beijing-backed', 'post-handover', 'contesting', 
'stymies', '400-strong', 'dismantle', 'fully-elected', 'considerable', 'directorate-grade', 'bureaucrats', '33,000', 'tier', 'mandarin', 'secretaries', 'src', 'barrel-per-day', 'distillation', 'stuck', 'x-ray', 'no.3', 'varied', 'exchanger', '285,000', 'co-owned', 'petrolem', 'joint-venture', 'chevron', 'texaco', '+65-8703086', 'loxley', '332.66', 'reviewed', '6.66', '266.37', '662-252-9950', 'mth', 'pvs', 'yr-ago', '+0.1', '+0.0', '119.3**', '+3.7', '+3.6', '+4.7', '119.3', '+0,2', '+3.5', '+5.2', 'jobless', 'inem', '63,913', '33,149', '65,345', '2.17m', '13.67', '14.15', '15.19', '196.8', '180.6', '279.9', 'cur', '110.4', '+1,161', '+400.9', '+310.4', '54,703.0', '+0.2', '119.6**', '+1.2', '+1.5', '+7.1', '119.6', 'prod', '+1.0', '+9.8', '108.4**', 'm4', '+2.6', '+4.2r', '+10.8', 'adj', 'trln', '75.912', '1,100.7', '1,164.1', '988.2', '1,315.7', '1,433.4', '1,236.5', '215.0', '269.3', '248.3', '1,334.0', '1,119.0', '1,420.9', 'govt.budget', 'govt.fcast', '+282.1', '380.6', '+230.4', 'def', '1,184.0', '1,466.1', '1,456.7', 'qtr', 'epa', '+168,130', '+31,230', '+167,330', 'yr-yr', '+1.9', '+2.3r', '+3.4', '18.1', '16.9', '69.7', '7.25', '7.50', '04/06/96', 'customs-cleared', 'annualised', 'ine', 'variation', 'total-', 'corresponds', 'relate', 'finances', '**general', '100=1992', '100=1990', 'obstructing', 'lasa-zabala', 'gal', 'prescriptions', 'gomez', 'liano', 'aznar', 'bch', 'hive', 'coopers', 'lybrand', 'emigrates', 'lenzing', 'viscose', 'fibre', 'preview', '84.5', 'schillings', 'fibres', 'economies', '+431', '53112', 'fundamentalists', 'masterminds', 'ideologists', 'financers', 'clarifications', 'clarification', '1676/96', 'amending', '2454/93', '2913/92', 'donna', 'topic', 'pundits', 'debated', 'forgo', 'unflagging', 'sidestepped', 'strong-dollar', 'bentsen', 'viewed', 'distinctively', 'widness', 'timely', 'instances', 'post-second', '1.3438', '79.75', 'stands', '1.48', 'expertise', 'co-chairman', 'faust', 'bailard', 'biehl', 'kaiser', 'awfully', 
'bentsen-era', 'greenspan', 'reappointment', 'perelstein', 'mainstay', 'amstetten', 'ewald', 'brenner', 'stieglmair', 'brunmayr', '43rd', 'marino', 'hartson', 'best-of-three', 'ex-world', '24-kms', 'samokhalova', 'spirited', 'quigley', 'numerical', 'superiority', 'goulnara', 'fatkoullina', 'snatching', 'lapped', 'ingrid', 'haringa', 'lancien', '12.341', '12.348', '12.130', '12.124', '12.112', '12.246', '11.959', '12.225', '24-km', '31.081', 'tatiana', 'stiajkina', 'arndt', 'vikstedt-nyman', 'boyden', 'godras', 'kombouare', 'abderdeen', '467,000', 'aitken', 'affection', 'ginola', 'influential', 'influenced', 'imola', 'doohan', '50.250', 'bayle', '1:50.727', 'norifumi', 'abe', '1:50.858', 'luca', 'cadalora', '1:51.006', 'criville', '1:51.075', '1:51.287', 'tadayuki', 'okada', '1:51.528', 'checa', '1:51.588', '1:51.784', 'shinichi', 'itoh', '1:51.857', '216', '217', 'swe', 'bradley', 'hughes']\n" ] } ], "source": [ "v = build_vocab(slowa_train)\n", "v.set_default_index(v[\"\"])\n", "itos = v.get_itos() # mapowanie indeksów na tokeny\n", "print(len(itos)) # liczba różnych tokenów w słowniku\n", "print(itos)" ] }, { "cell_type": "code", "execution_count": 66, "metadata": {}, "outputs": [ { "name": "stdout", "output_type": "stream", "text": [ "{'B-ORG': 0, 'O': 1, 'B-MISC': 2, 'B-PER': 3, 'I-PER': 4, 'B-LOC': 5, 'I-ORG': 6, 'I-MISC': 7, 'I-LOC': 8}\n" ] } ], "source": [ "# slownik etykiety - kody etykiet\n", "etykieta_na_kod = {}\n", "licznik = 0\n", "for tekst in train[\"y\"]:\n", " for etykieta in tekst.split(\" \"):\n", " if etykieta not in etykieta_na_kod:\n", " etykieta_na_kod[etykieta] = licznik\n", " licznik+=1\n", "print(etykieta_na_kod)" ] }, { "cell_type": "code", "execution_count": 67, "metadata": {}, "outputs": [ { "name": "stdout", "output_type": "stream", "text": [ "[0, 1, 2, 1, 1, 1, 2, 1, 1, 1, 3, 4, 1, 5, 1, 1, 1, 0, 6, 1, 1, 1, 1, 1, 1, 2, 1, 1, 1, 1, 1, 2, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 5, 1, 1, 1, 1, 0, 6, 1, 1, 1, 3, 4, 1, 1, 1, 1, 1, 
1, 1, 1, 1, 1, 1, 5, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 0, 1, 1, 1, 3, 4, 4, 4, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 0, 6, 1, 1, 1, 1, 1, 1, 1, 1, 1, 0, 1, 1, 3, 4, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 3, 1, 2, 1, 1, 1, 1, 5, 1, 5, 1, 1, 1, 1, 1, 1, 1, 2, 7, 7, 1, 2, 1, 1, 1, 1, 1, 1, 1, 1, 3, 1, 1, 1, 1, 1, 1, 1, 0, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 2, 1, 1, 3, 4, 4, 1, 1, 1, 3, 1, 1, 0, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 5, 1, 5, 1, 3, 1, 1, 1, 1, 1, 0, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 2, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 2, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 2, 1, 1, 1, 1, 1, 1, 2, 1, 1, 1, 1, 1, 5, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 5, 1, 1, 1, 1, 0, 6, 6, 6, 6, 1, 0, 1, 1, 3, 4, 4, 1, 1, 0, 6, 1, 1, 5, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 2, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 5, 1, 1, 1, 1, 5, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 2, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1]\n" ] } ], "source": [ "# podziel etykiety\n", "kody_etykiet_train = []\n", "for tekst in train[\"y\"]:\n", " pom = []\n", " for etykieta in tekst.split(\" \"):\n", " pom.append(etykieta_na_kod[etykieta])\n", " kody_etykiet_train.append(pom)\n", "print(kody_etykiet_train[0])" ] }, { "cell_type": "code", "execution_count": 68, "metadata": {}, "outputs": [ { "name": "stdout", "output_type": "stream", "text": [ "O O B-ORG O O O O O O O O O B-LOC O O B-MISC I-MISC O B-PER I-PER O O O O O O O B-ORG O B-ORG O O O O O O O O O O O O O O O O O O O O O O O O O O O O O O O O O O B-ORG O B-ORG O B-ORG O O O O O O B-ORG O O O O O O O O O O B-ORG O O O O B-ORG O O O O O O O O B-LOC I-LOC O B-ORG O O O O O O O O O O O O O O B-LOC 
O B-PER I-PER O O O O O O O O O O B-ORG O O O O O O O O O B-PER O O O O O O O O O O B-ORG O O O O O O O O O O O B-PER I-PER O B-PER I-PER O O O O O O O O O B-ORG O B-LOC O O B-PER O O O O B-LOC O O O O O O O O O O O O O O O O B-ORG O O O O O O O O O O O O O O O B-ORG O O O O O O O O O B-PER O O O O O O O O O O O O O O O O O O O O O O O O O O O O B-LOC O B-ORG O B-PER I-PER O O O O O B-LOC O O O O O O O O O O O O O O O O O O O O O O O O O B-ORG O O O O O O O B-LOC O B-PER I-PER O O O O B-ORG O O O O O O O O O O O O B-ORG O O O O O O O O O O O O O B-ORG O O O O O O O O O O O O O O O O O O O O B-MISC B-PER I-PER O O O O O B-PER I-PER O O O O B-PER I-PER O O O O B-ORG O O O O O O O O O O O O O O O O O O O O O O O O O O O O B-ORG O O O O O O B-ORG O O O O O O O O O O O O O B-PER I-PER O B-MISC O O B-PER I-PER O O O O O O O O B-ORG O O O O O O O\n", "456\n", "[1, 1, 0, 1, 1, 1, 1, 1, 1, 1, 1, 1, 5, 1, 1, 2, 7, 1, 3, 4, 1, 1, 1, 1, 1, 1, 1, 0, 1, 0, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 0, 1, 0, 1, 0, 1, 1, 1, 1, 1, 1, 0, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 0, 1, 1, 1, 1, 0, 1, 1, 1, 1, 1, 1, 1, 1, 5, 8, 1, 0, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 5, 1, 3, 4, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 0, 1, 1, 1, 1, 1, 1, 1, 1, 1, 3, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 0, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 3, 4, 1, 3, 4, 1, 1, 1, 1, 1, 1, 1, 1, 1, 0, 1, 5, 1, 1, 3, 1, 1, 1, 1, 5, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 0, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 0, 1, 1, 1, 1, 1, 1, 1, 1, 1, 3, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 5, 1, 0, 1, 3, 4, 1, 1, 1, 1, 1, 5, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 0, 1, 1, 1, 1, 1, 1, 1, 5, 1, 3, 4, 1, 1, 1, 1, 0, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 0, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 0, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 2, 3, 4, 1, 1, 1, 1, 1, 3, 4, 1, 1, 1, 1, 3, 
4, 1, 1, 1, 1, 0, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 0, 1, 1, 1, 1, 1, 1, 0, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 3, 4, 1, 2, 1, 1, 3, 4, 1, 1, 1, 1, 1, 1, 1, 1, 0, 1, 1, 1, 1, 1, 1, 1]\n", "456\n" ] } ], "source": [ "# odczytaj etykiety dev-0\n", "labels_dev0 = pd.read_csv('dev-0/expected.tsv', sep='\\t', names=['y'], header=None)\n", "\n", "print(labels_dev0[\"y\"][0])\n", "print(len(labels_dev0[\"y\"][0].split(\" \")))\n", "\n", "# podziel etykiety\n", "kody_etykiet_dev0 = []\n", "for tekst in labels_dev0[\"y\"]:\n", " pom = []\n", " for etykieta in tekst.split(\" \"):\n", " pom.append(etykieta_na_kod[etykieta])\n", " kody_etykiet_dev0.append(pom)\n", "\n", "print(kody_etykiet_dev0[0])\n", "print(len(kody_etykiet_dev0[0]))" ] }, { "cell_type": "code", "execution_count": 69, "metadata": {}, "outputs": [], "source": [ "def data_process(dt):\n", " # Wektoryzacja dokumentów tekstowych.\n", " return [\n", " torch.tensor(\n", " [v[\"\"]] + [v[token] for token in document] + [v[\"\"]],\n", " dtype=torch.long,\n", " )\n", " for document in dt\n", " ]\n", "\n", "def labels_process(dt):\n", " # Wektoryzacja etykiet (NER)\n", " return [torch.tensor([0] + document + [0], dtype=torch.long) for document in dt]" ] }, { "cell_type": "code", "execution_count": 70, "metadata": {}, "outputs": [], "source": [ "train_tokens_ids = data_process(slowa_train)\n", "test_dev0_tokens_ids = data_process(slowa_test_dev0)\n", "test_A_tokens_ids = data_process(slowa_test_A)\n", "\n", "train_labels = labels_process(kody_etykiet_train)\n", "test_dev0_labels = labels_process(kody_etykiet_dev0)" ] }, { "cell_type": "code", "execution_count": 71, "metadata": {}, "outputs": [ { "name": "stdout", "output_type": "stream", "text": [ "945 491\n", "215 458\n", "230 443\n", "tensor([ 2, 4, 5, 6, 7, 8, 9, 10, 11, 12, 13, 14, 15, 13,\n", " 16, 17, 13, 18, 19, 20, 21, 22, 23, 24, 25, 26, 6, 27,\n", " 8, 28, 8, 29, 10, 11, 30, 31, 32, 33, 34, 35, 36, 37,\n", 
" 38, 39, 8, 40, 12, 13, 41, 42, 43, 8, 18, 19, 44, 42,\n", " 45, 46, 47, 48, 21, 22, 49, 28, 50, 51, 52, 53, 54, 55,\n", " 56, 57, 30, 18, 58, 27, 59, 60, 12, 13, 61, 62, 63, 64,\n", " 65, 66, 67, 68, 69, 62, 63, 64, 70, 66, 71, 72, 24, 73,\n", " 61, 18, 20, 42, 74, 75, 76, 77, 78, 79, 80, 81, 82, 83,\n", " 12, 13, 84, 21, 85, 58, 86, 59, 87, 88, 89, 24, 59, 90,\n", " 91, 92, 59, 93, 24, 50, 38, 94, 95, 18, 19, 44, 12, 13,\n", " 84, 21, 81, 96, 97, 98, 95, 4, 99, 100, 101, 102, 8, 103,\n", " 40, 104, 73, 105, 88, 106, 107, 53, 18, 108, 88, 109, 110, 111,\n", " 59, 81, 112, 113, 88, 114, 115, 8, 116, 108, 117, 12, 13, 102,\n", " 118, 119, 120, 121, 122, 53, 57, 88, 123, 91, 124, 125, 126, 40,\n", " 127, 128, 129, 130, 131, 132, 133, 134, 135, 34, 35, 36, 12, 13,\n", " 136, 102, 137, 8, 138, 139, 96, 121, 18, 4, 42, 140, 45, 46,\n", " 73, 141, 109, 117, 142, 73, 143, 89, 67, 92, 59, 144, 145, 146,\n", " 59, 147, 81, 148, 149, 8, 108, 117, 12, 13, 150, 99, 151, 152,\n", " 153, 154, 155, 156, 157, 102, 158, 159, 4, 99, 160, 161, 162, 163,\n", " 164, 165, 166, 167, 61, 168, 169, 12, 61, 13, 12, 13, 147, 123,\n", " 88, 57, 170, 102, 42, 96, 12, 13, 18, 4, 42, 58, 45, 88,\n", " 171, 172, 173, 174, 8, 175, 18, 176, 177, 178, 98, 88, 179, 180,\n", " 8, 18, 181, 45, 142, 12, 13, 40, 182, 183, 184, 185, 8, 128,\n", " 186, 73, 81, 187, 36, 188, 8, 133, 189, 190, 191, 8, 182, 184,\n", " 192, 8, 193, 167, 194, 195, 109, 196, 12, 13, 10, 197, 198, 22,\n", " 23, 146, 59, 66, 199, 8, 108, 117, 53, 200, 40, 73, 136, 201,\n", " 202, 91, 6, 203, 27, 8, 28, 8, 204, 10, 11, 205, 206, 28,\n", " 207, 208, 12, 13, 61, 209, 62, 182, 8, 38, 210, 211, 163, 190,\n", " 212, 55, 54, 173, 213, 8, 214, 41, 42, 215, 73, 61, 216, 217,\n", " 197, 161, 44, 132, 218, 134, 219, 220, 221, 222, 21, 22, 223, 224,\n", " 12, 13, 225, 226, 227, 228, 8, 116, 229, 117, 121, 230, 231, 232,\n", " 233, 234, 121, 81, 10, 235, 236, 237, 127, 128, 159, 238, 188, 8,\n", " 34, 35, 36, 95, 239, 240, 241, 12, 13, 41, 
242, 243, 40, 53,\n", " 57, 97, 244, 73, 245, 246, 163, 247, 248, 12, 13, 24, 249, 233,\n", " 250, 251, 163, 10, 252, 73, 253, 254, 255, 163, 256, 248, 12, 13,\n", " 3])\n", "tensor([ 2, 2005, 640, 2049, 214, 779, 158, 386, 121, 2094,\n", " 1802, 12, 13, 265, 19358, 13, 1005, 5480, 2289, 1697,\n", " 2052, 768, 2171, 72, 8937, 22, 1098, 145, 2049, 1762,\n", " 2021, 95, 159, 2094, 88, 3721, 2987, 233, 395, 951,\n", " 8, 214, 779, 158, 18, 1815, 163, 18, 2006, 2007,\n", " 12, 13, 200, 4835, 22, 386, 73, 6024, 73, 1066,\n", " 38, 14326, 145, 1975, 392, 2038, 73, 9340, 88, 2074,\n", " 416, 1362, 233, 22, 1802, 481, 2041, 3394, 309, 72,\n", " 2855, 371, 233, 200, 16878, 1772, 746, 2068, 12, 13,\n", " 121, 2137, 2021, 788, 72, 6261, 22, 18, 382, 3407,\n", " 158, 14885, 3408, 73, 2049, 1200, 200, 652, 2094, 95,\n", " 2112, 2987, 1023, 1592, 6184, 788, 72, 0, 26, 1348,\n", " 0, 2828, 14773, 1982, 992, 72, 6261, 12, 13, 8333,\n", " 95, 0, 73, 2021, 2967, 81, 5593, 1575, 8, 200,\n", " 501, 2094, 1023, 2052, 6760, 233, 8, 0, 1088, 788,\n", " 72, 16349, 12, 13, 2038, 73, 1287, 73, 2539, 3442,\n", " 8, 14563, 200, 386, 975, 121, 14761, 2102, 88, 14,\n", " 67, 408, 1088, 81, 1125, 13917, 22, 200, 1772, 746,\n", " 2084, 158, 2083, 12, 13, 2102, 73, 411, 1532, 8,\n", " 1348, 42, 9847, 5710, 73, 6469, 14794, 73, 139, 652,\n", " 2007, 6162, 163, 18, 1844, 73, 145, 2038, 6329, 0,\n", " 88, 768, 81, 652, 2094, 215, 163, 2869, 12, 13,\n", " 95, 18, 1599, 2084, 155, 4486, 91, 301, 81, 0,\n", " 6485, 136, 7294, 67, 155, 0, 200, 5382, 73, 1982,\n", " 2171, 72, 677, 233, 9000, 3384, 88, 1971, 1088, 9164,\n", " 22, 3383, 72, 1881, 88, 9896, 72, 6164, 12, 13,\n", " 158, 18, 2093, 73, 2074, 2526, 1825, 2115, 73, 2167,\n", " 2168, 0, 95, 1348, 73, 1241, 8, 4778, 139, 4601,\n", " 145, 84, 5703, 139, 2171, 72, 1355, 22, 23, 26,\n", " 5493, 790, 788, 22, 1098, 233, 18, 1772, 746, 2076,\n", " 12, 13, 84, 59, 1490, 170, 95, 1348, 17445, 1684,\n", " 0, 318, 3394, 1663, 145, 2074, 1362, 22, 0, 72,\n", 
" 1095, 73, 81, 215, 163, 0, 12, 13, 9340, 844,\n", " 309, 18, 5713, 72, 200, 652, 2007, 1975, 765, 19457,\n", " 95, 5429, 2082, 8, 6697, 72, 1881, 233, 200, 501,\n", " 2094, 73, 712, 550, 2987, 1836, 53, 8607, 159, 2094,\n", " 3778, 12, 13, 334, 1721, 584, 768, 996, 72, 2869,\n", " 136, 1825, 2772, 73, 0, 73, 88, 1686, 0, 73,\n", " 6272, 73, 768, 9340, 8, 0, 88, 81, 652, 2094,\n", " 215, 163, 0, 12, 13, 121, 18, 0, 163, 6016,\n", " 18, 382, 1451, 163, 200, 1772, 12355, 6360, 95, 18,\n", " 6167, 73, 2041, 6760, 309, 81, 6675, 8, 0, 2068,\n", " 72, 0, 12, 13, 322, 312, 428, 309, 95, 81,\n", " 0, 5763, 53, 1671, 2807, 136, 0, 2284, 2285, 1949,\n", " 0, 768, 2171, 72, 3892, 12, 13, 95, 0, 2041,\n", " 155, 6329, 2053, 72, 992, 12, 13, 3])\n", "tensor([ 2, 1759, 640, 1677, 1997, 6422, 2306, 73, 345, 233,\n", " 3805, 3778, 12, 13, 0, 0, 13, 0, 73, 820,\n", " 1077, 1078, 0, 13, 1677, 1315, 18, 3104, 163, 200,\n", " 5613, 1770, 1975, 26, 81, 6422, 1763, 2306, 746, 667,\n", " 233, 81, 391, 2103, 2007, 1772, 22, 1098, 12, 13,\n", " 136, 345, 4535, 200, 3815, 4790, 1088, 233, 18, 501,\n", " 1772, 163, 18, 391, 73, 7709, 8, 81, 3805, 2328,\n", " 3778, 8, 17348, 0, 12, 13, 345, 1114, 939, 163,\n", " 18, 1772, 88, 4535, 3692, 3916, 6349, 30, 18, 2403,\n", " 2302, 1108, 0, 2164, 0, 0, 768, 6485, 163, 81,\n", " 0, 754, 9477, 8, 11483, 18, 6366, 779, 18, 3888,\n", " 368, 11451, 88, 301, 159, 7667, 1373, 12, 13, 0,\n", " 0, 3394, 4647, 163, 18, 2306, 233, 3841, 371, 73,\n", " 6365, 159, 0, 1156, 6322, 2940, 53, 1876, 923, 18,\n", " 3741, 12, 13, 18, 314, 5957, 1126, 59, 3817, 233,\n", " 159, 5613, 1770, 3123, 2488, 72, 18, 652, 371, 12,\n", " 13, 781, 2856, 18, 5613, 1839, 1975, 395, 1201, 2577,\n", " 73, 0, 173, 233, 18, 3123, 145, 12225, 12, 13,\n", " 395, 2357, 53, 754, 12990, 233, 18, 97, 996, 3097,\n", " 2999, 1677, 8, 3918, 53, 1572, 88, 8962, 416, 992,\n", " 1469, 53, 200, 382, 162, 746, 667, 12, 13, 0,\n", " 0, 2159, 18, 1832, 233, 18, 0, 2302, 73, 3776,\n", " 8, 1815, 81, 
0, 0, 5287, 425, 18, 710, 426,\n", " 189, 9691, 0, 0, 691, 8, 182, 14169, 136, 2000,\n", " 2999, 8, 17948, 301, 18, 1373, 12, 13, 24, 59,\n", " 18, 501, 6799, 17399, 95, 667, 233, 2171, 3097, 12,\n", " 13, 7236, 875, 18629, 472, 8, 0, 81, 183, 6366,\n", " 301, 18, 3741, 233, 18, 1781, 2302, 136, 147, 10460,\n", " 8, 0, 24, 301, 18, 386, 11605, 163, 0, 42,\n", " 426, 12, 13, 0, 0, 155, 1635, 667, 18, 215,\n", " 26, 81, 0, 9477, 233, 18, 2983, 2302, 12, 13,\n", " 1677, 2000, 6670, 0, 8, 18, 710, 2338, 3741, 72,\n", " 939, 163, 18, 2210, 136, 20403, 0, 18, 710, 3104,\n", " 12, 13, 0, 5634, 661, 4851, 0, 0, 322, 1121,\n", " 12, 13, 1677, 2532, 0, 0, 21, 380, 161, 161,\n", " 18, 710, 961, 426, 15063, 6422, 72, 596, 12, 13,\n", " 18, 714, 2159, 177, 88, 2000, 2489, 0, 88, 8579,\n", " 183, 3384, 189, 3394, 24, 5616, 72, 596, 12, 161,\n", " 13, 161, 13, 1677, 73, 0, 163, 18, 1654, 1770,\n", " 233, 1590, 88, 3806, 11627, 233, 18, 1654, 95, 12663,\n", " 73, 173, 12675, 8, 14563, 200, 1975, 719, 12, 13,\n", " 0, 1071, 2008, 933, 88, 1705, 2589, 214, 22, 2609,\n", " 22, 4025, 233, 391, 81, 2010, 12, 13, 416, 2171,\n", " 2957, 173, 912, 26, 808, 3894, 3024, 53, 808, 2210,\n", " 12, 13, 3])\n" ] } ], "source": [ "print(len(train_tokens_ids), len(train_tokens_ids[0]))\n", "print(len(test_dev0_tokens_ids), len(test_dev0_tokens_ids[0]))\n", "print(len(test_A_tokens_ids), len(test_A_tokens_ids[0]))\n", "\n", "print(train_tokens_ids[0])\n", "print(test_dev0_tokens_ids[0])\n", "print(test_A_tokens_ids[0])" ] }, { "cell_type": "code", "execution_count": 72, "metadata": {}, "outputs": [ { "name": "stdout", "output_type": "stream", "text": [ "945 491\n", "215 458\n", "tensor([0, 0, 1, 2, 1, 1, 1, 2, 1, 1, 1, 3, 4, 1, 5, 1, 1, 1, 0, 6, 1, 1, 1, 1,\n", " 1, 1, 2, 1, 1, 1, 1, 1, 2, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1,\n", " 5, 1, 1, 1, 1, 0, 6, 1, 1, 1, 3, 4, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 5,\n", " 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1,\n", " 1, 1, 
1, 1, 0, 1, 1, 1, 3, 4, 4, 4, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1,\n", " 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 0, 6, 1, 1, 1, 1, 1, 1,\n", " 1, 1, 1, 0, 1, 1, 3, 4, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1,\n", " 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 3, 1, 2, 1, 1, 1, 1, 5, 1, 5, 1,\n", " 1, 1, 1, 1, 1, 1, 2, 7, 7, 1, 2, 1, 1, 1, 1, 1, 1, 1, 1, 3, 1, 1, 1, 1,\n", " 1, 1, 1, 0, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1,\n", " 1, 1, 1, 1, 1, 1, 1, 1, 2, 1, 1, 3, 4, 4, 1, 1, 1, 3, 1, 1, 0, 1, 1, 1,\n", " 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 5, 1, 5, 1, 3, 1, 1, 1, 1,\n", " 1, 0, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1,\n", " 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 2, 1, 1, 1, 1, 1, 1,\n", " 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 2, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1,\n", " 1, 1, 1, 1, 1, 1, 2, 1, 1, 1, 1, 1, 1, 2, 1, 1, 1, 1, 1, 5, 1, 1, 1, 1,\n", " 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 5, 1, 1, 1, 1, 0, 6, 6, 6,\n", " 6, 1, 0, 1, 1, 3, 4, 4, 1, 1, 0, 6, 1, 1, 5, 1, 1, 1, 1, 1, 1, 1, 1, 1,\n", " 1, 1, 1, 1, 1, 1, 2, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1,\n", " 1, 5, 1, 1, 1, 1, 5, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 2,\n", " 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 0])\n", "tensor([0, 1, 1, 0, 1, 1, 1, 1, 1, 1, 1, 1, 1, 5, 1, 1, 2, 7, 1, 3, 4, 1, 1, 1,\n", " 1, 1, 1, 1, 0, 1, 0, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1,\n", " 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 0, 1, 0, 1, 0, 1, 1,\n", " 1, 1, 1, 1, 0, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 0, 1, 1, 1, 1, 0, 1, 1, 1,\n", " 1, 1, 1, 1, 1, 5, 8, 1, 0, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 5,\n", " 1, 3, 4, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 0, 1, 1, 1, 1, 1, 1, 1, 1, 1, 3,\n", " 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 0, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 3, 4,\n", " 1, 3, 4, 1, 1, 1, 1, 1, 1, 1, 1, 1, 0, 1, 5, 1, 1, 3, 1, 1, 1, 1, 5, 1,\n", " 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 0, 1, 1, 1, 1, 1, 1, 1, 1,\n", " 1, 1, 1, 
def get_scores(y_true, y_pred, negative_label=0):
    """Return token-level precision, recall and F1 for two label sequences.

    A token counts as "selected" when its predicted code differs from
    ``negative_label`` and as "relevant" when its gold code differs from
    ``negative_label``. A true positive is a selected token whose predicted
    code equals the gold code.

    Args:
        y_true: iterable of gold label codes (non-negative class indices).
        y_pred: iterable of predicted label codes, aligned with ``y_true``.
            Pairs are formed with ``zip``, so extra items in the longer
            sequence are ignored.
        negative_label: code of the background ("no entity") class. The
            default ``0`` reproduces the previous hard-coded ``> 0`` test for
            non-negative codes.

    Returns:
        Tuple ``(precision, recall, f1)`` of floats. Precision is 1.0 when
        nothing was selected, recall is 1.0 when nothing is relevant, and F1
        is 0.0 when both precision and recall are 0.

    NOTE(review): the decoded predictions printed further down in this
    notebook pair code 1 with 'O' and code 0 with 'B-ORG'. If that mapping
    holds, the default treats 'O' as an entity and 'B-ORG' as background;
    callers should then pass the code of 'O' -- confirm against
    ``etykieta_na_kod``.
    """
    tp = 0
    selected_items = 0
    relevant_items = 0

    for p, t in zip(y_pred, y_true):
        if p != negative_label:
            selected_items += 1
            if p == t:
                tp += 1

        if t != negative_label:
            relevant_items += 1

    # Empty denominators are scored as perfect, matching the original convention.
    precision = tp / selected_items if selected_items else 1.0
    recall = tp / relevant_items if relevant_items else 1.0

    if precision + recall == 0.0:
        f1 = 0.0
    else:
        f1 = 2 * precision * recall / (precision + recall)

    return precision, recall, f1
class LSTM(torch.nn.Module):
    """Sequence tagger: embedding -> single-layer LSTM -> linear layer per token.

    The embedding table size comes from the notebook-level vocabulary ``v``
    and the output size from the notebook-level ``num_tags``; both must be
    defined before the model is instantiated.
    """

    def __init__(self):
        super(LSTM, self).__init__()
        # One 100-dimensional vector per entry of v.get_itos().
        self.emb = torch.nn.Embedding(len(v.get_itos()), 100)
        # Single-layer LSTM, 100 -> 256, batch dimension first.
        self.rec = torch.nn.LSTM(100, 256, 1, batch_first=True)
        # Maps every LSTM output vector to one score per tag.
        self.fc1 = torch.nn.Linear(256, num_tags)

    def forward(self, x):
        """Return unnormalised tag scores for every position of ``x``.

        ``x`` holds token ids; the result has the same leading dimensions as
        the LSTM output with a last dimension of ``num_tags``.
        """
        emb = torch.relu(self.emb(x))
        # Only the per-step outputs are needed; the final states are dropped.
        lstm_output, _ = self.rec(emb)
        out_weights = self.fc1(lstm_output)
        return out_weights


def eval_model(dataset_tokens, dataset_labels, model):
    """Tag every sequence with ``model`` and score the result with ``get_scores``.

    Args:
        dataset_tokens: indexable collection of 1-D token-id tensors.
        dataset_labels: indexable collection of 1-D label-code tensors, aligned
            with ``dataset_tokens``; its length decides how many sequences are
            evaluated.
        model: callable mapping a ``(1, seq_len)`` token tensor to a
            ``(1, seq_len, num_tags)`` score tensor.

    Returns:
        Whatever ``get_scores(Y_true, Y_pred)`` returns for the flattened gold
        and predicted codes of all sequences.

    The train/eval mode of ``model`` is not changed here; callers decide it.
    """
    Y_true = []
    Y_pred = []

    # Inference only: disabling autograd avoids building a graph per sequence.
    with torch.no_grad():
        for i in tqdm(range(len(dataset_labels))):
            # Add the batch dimension expected by the batch_first model.
            batch_tokens = dataset_tokens[i].unsqueeze(0)
            Y_true += dataset_labels[i].tolist()

            Y_batch_pred_weights = model(batch_tokens).squeeze(0)
            # Highest-scoring tag for every token.
            Y_pred += torch.argmax(Y_batch_pred_weights, 1).tolist()

    return get_scores(Y_true, Y_pred)
def zwroc_przewidywania(tokeny, model=None):
    """Return the predicted label codes for every token sequence.

    Args:
        tokeny: indexable collection of 1-D token-id tensors; each one is
            passed to the model as-is (no batch dimension is added).
        model: callable mapping a token tensor to a ``(seq_len, num_tags)``
            score tensor. Defaults to the notebook-level ``lstm``.

    Returns:
        A list with one list of integer label codes per input sequence.
    """
    if model is None:
        model = lstm

    Y_pred = []
    # Inference only: no autograd graph is needed.
    with torch.no_grad():
        for i in tqdm(range(len(tokeny))):
            wagi = model(tokeny[i])
            # Highest-scoring tag for every token.
            kody = torch.argmax(wagi, 1)
            Y_pred.append(list(kody.numpy()))
    return Y_pred


def zamien_przewidziane_kody_na_etykiety(przewidywania, kod_na_etykiete=None):
    """Convert predicted label codes to label names and drop the BOS/EOS slots.

    Args:
        przewidywania: iterable of code sequences, one per document; the first
            and last item of every sequence are removed from the result.
        kod_na_etykiete: optional mapping from code to label name. When
            omitted it is built by inverting the notebook-level
            ``etykieta_na_kod``; if several labels share a code, the last one
            in iteration order wins.

    Returns:
        A list of label lists. A code missing from the mapping becomes
        ``None``. Sequences with fewer than three items yield an empty list.
    """
    if kod_na_etykiete is None:
        # Invert once instead of scanning the dictionary for every token.
        kod_na_etykiete = {kod: etykieta for etykieta, kod in etykieta_na_kod.items()}

    etykiety = []
    for lista in przewidywania:
        pom = [kod_na_etykiete.get(int(kod)) for kod in lista]
        # Slicing removes the BOS/EOS positions and is safe for short input.
        etykiety.append(pom[1:-1])
    return etykiety
1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 3, 4, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 5, 8, 1, 6, 1, 1, 1, 1, 1, 1, 1, 1, 0, 1, 0, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 0, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 5, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 5, 1, 5, 1, 1, 1, 1, 1, 6, 1, 5, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 0, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 5, 1, 1, 6, 1, 1, 1, 1, 1, 5, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 0, 1, 1, 1, 1, 1, 1, 1, 5, 1, 3, 4, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 5, 1, 1, 0, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 2, 6, 6, 1, 1, 1, 1, 1, 1, 1, 1, 0, 1, 1, 1, 4, 1, 1, 1, 1, 1, 1, 5, 1, 1, 1, 1, 1, 1, 5, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 0, 6, 1, 1, 1, 1, 1, 8, 1, 5, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 2, 4, 1, 5, 6, 1, 6, 6, 1, 1, 1, 1, 1, 1, 1, 3, 4, 1, 1, 1, 1, 1, 1, 1, 0]\n", "458\n", "['O', 'O', 'B-MISC', 'O', 'O', 'O', 'O', 'O', 'O', 'O', 'O', 'O', 'B-LOC', 'O', 'O', 'B-LOC', 'I-LOC', 'O', 'O', 'I-ORG', 'O', 'O', 'O', 'O', 'O', 'O', 'O', 'O', 'O', 'B-ORG', 'O', 'O', 'O', 'O', 'O', 'O', 'O', 'O', 'O', 'O', 'O', 'O', 'O', 'O', 'O', 'O', 'O', 'B-MISC', 'O', 'O', 'O', 'O', 'O', 'O', 'O', 'O', 'O', 'O', 'O', 'O', 'O', 'O', 'O', 'O', 'O', 'O', 'B-ORG', 'O', 'B-LOC', 'O', 'O', 'O', 'O', 'O', 'O', 'O', 'O', 'O', 'O', 'O', 'O', 'O', 'O', 'O', 'O', 'O', 'B-LOC', 'O', 'O', 'O', 'O', 'O', 'O', 'O', 'O', 'O', 'O', 'O', 'O', 'O', 'O', 'O', 'O', 'B-PER', 'I-PER', 'O', 'O', 'O', 'O', 'O', 'O', 'O', 'O', 'O', 'O', 'O', 'O', 'O', 'B-LOC', 'I-LOC', 'O', 'I-ORG', 'O', 'O', 'O', 'O', 'O', 'O', 'O', 'O', 'B-ORG', 'O', 'B-ORG', 'O', 'O', 'O', 'O', 'O', 'O', 'O', 'O', 'O', 'O', 'O', 'O', 'O', 'O', 'O', 'O', 'O', 'O', 'O', 'O', 'B-ORG', 'O', 'O', 'O', 'O', 'O', 'O', 
'O', 'O', 'O', 'O', 'O', 'O', 'O', 'O', 'B-LOC', 'O', 'O', 'O', 'O', 'O', 'O', 'O', 'O', 'O', 'O', 'B-LOC', 'O', 'B-LOC', 'O', 'O', 'O', 'O', 'O', 'I-ORG', 'O', 'B-LOC', 'O', 'O', 'O', 'O', 'O', 'O', 'O', 'O', 'O', 'O', 'O', 'O', 'O', 'O', 'O', 'O', 'B-ORG', 'O', 'O', 'O', 'O', 'O', 'O', 'O', 'O', 'O', 'O', 'O', 'O', 'O', 'O', 'O', 'O', 'O', 'O', 'O', 'O', 'O', 'O', 'O', 'O', 'O', 'O', 'O', 'O', 'O', 'O', 'O', 'O', 'O', 'O', 'O', 'O', 'O', 'O', 'O', 'O', 'O', 'O', 'O', 'O', 'O', 'O', 'O', 'O', 'O', 'O', 'O', 'O', 'O', 'O', 'O', 'O', 'B-LOC', 'O', 'O', 'I-ORG', 'O', 'O', 'O', 'O', 'O', 'B-LOC', 'O', 'O', 'O', 'O', 'O', 'O', 'O', 'O', 'O', 'O', 'O', 'O', 'O', 'O', 'O', 'O', 'O', 'O', 'O', 'O', 'O', 'O', 'O', 'O', 'O', 'B-ORG', 'O', 'O', 'O', 'O', 'O', 'O', 'O', 'B-LOC', 'O', 'B-PER', 'I-PER', 'O', 'O', 'O', 'O', 'O', 'O', 'O', 'O', 'O', 'O', 'O', 'O', 'O', 'O', 'B-LOC', 'O', 'O', 'B-ORG', 'O', 'O', 'O', 'O', 'O', 'O', 'O', 'O', 'O', 'O', 'O', 'O', 'O', 'O', 'O', 'O', 'O', 'O', 'O', 'O', 'O', 'O', 'O', 'O', 'O', 'O', 'O', 'O', 'O', 'O', 'O', 'O', 'O', 'O', 'B-MISC', 'I-ORG', 'I-ORG', 'O', 'O', 'O', 'O', 'O', 'O', 'O', 'O', 'B-ORG', 'O', 'O', 'O', 'I-PER', 'O', 'O', 'O', 'O', 'O', 'O', 'B-LOC', 'O', 'O', 'O', 'O', 'O', 'O', 'B-LOC', 'O', 'O', 'O', 'O', 'O', 'O', 'O', 'O', 'O', 'O', 'O', 'O', 'O', 'O', 'O', 'O', 'O', 'O', 'O', 'B-ORG', 'I-ORG', 'O', 'O', 'O', 'O', 'O', 'I-LOC', 'O', 'B-LOC', 'O', 'O', 'O', 'O', 'O', 'O', 'O', 'O', 'O', 'O', 'O', 'B-MISC', 'I-PER', 'O', 'B-LOC', 'I-ORG', 'O', 'I-ORG', 'I-ORG', 'O', 'O', 'O', 'O', 'O', 'O', 'O', 'B-PER', 'I-PER', 'O', 'O', 'O', 'O', 'O', 'O', 'O']\n", "456\n", "tensor([0, 1, 1, 0, 1, 1, 1, 1, 1, 1, 1, 1, 1, 5, 1, 1, 2, 7, 1, 3, 4, 1, 1, 1,\n", " 1, 1, 1, 1, 0, 1, 0, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1,\n", " 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 0, 1, 0, 1, 0, 1, 1,\n", " 1, 1, 1, 1, 0, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 0, 1, 1, 1, 1, 0, 1, 1, 1,\n", " 1, 1, 1, 1, 1, 5, 8, 1, 0, 1, 1, 1, 1, 1, 1, 1, 
1, 1, 1, 1, 1, 1, 1, 5,\n", " 1, 3, 4, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 0, 1, 1, 1, 1, 1, 1, 1, 1, 1, 3,\n", " 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 0, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 3, 4,\n", " 1, 3, 4, 1, 1, 1, 1, 1, 1, 1, 1, 1, 0, 1, 5, 1, 1, 3, 1, 1, 1, 1, 5, 1,\n", " 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 0, 1, 1, 1, 1, 1, 1, 1, 1,\n", " 1, 1, 1, 1, 1, 1, 1, 0, 1, 1, 1, 1, 1, 1, 1, 1, 1, 3, 1, 1, 1, 1, 1, 1,\n", " 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 5, 1,\n", " 0, 1, 3, 4, 1, 1, 1, 1, 1, 5, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1,\n", " 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 0, 1, 1, 1, 1, 1, 1, 1, 5, 1, 3, 4, 1,\n", " 1, 1, 1, 0, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 0, 1, 1, 1, 1, 1, 1, 1,\n", " 1, 1, 1, 1, 1, 1, 0, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1,\n", " 1, 1, 1, 2, 3, 4, 1, 1, 1, 1, 1, 3, 4, 1, 1, 1, 1, 3, 4, 1, 1, 1, 1, 0,\n", " 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1,\n", " 1, 1, 1, 1, 0, 1, 1, 1, 1, 1, 1, 0, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1,\n", " 1, 3, 4, 1, 2, 1, 1, 3, 4, 1, 1, 1, 1, 1, 1, 1, 1, 0, 1, 1, 1, 1, 1, 1,\n", " 1, 0])\n", "458\n", "[1, 1, 0, 1, 1, 1, 1, 1, 1, 1, 1, 1, 5, 1, 1, 2, 7, 1, 3, 4, 1, 1, 1, 1, 1, 1, 1, 0, 1, 0, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 0, 1, 0, 1, 0, 1, 1, 1, 1, 1, 1, 0, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 0, 1, 1, 1, 1, 0, 1, 1, 1, 1, 1, 1, 1, 1, 5, 8, 1, 0, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 5, 1, 3, 4, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 0, 1, 1, 1, 1, 1, 1, 1, 1, 1, 3, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 0, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 3, 4, 1, 3, 4, 1, 1, 1, 1, 1, 1, 1, 1, 1, 0, 1, 5, 1, 1, 3, 1, 1, 1, 1, 5, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 0, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 0, 1, 1, 1, 1, 1, 1, 1, 1, 1, 3, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 5, 1, 0, 1, 3, 4, 1, 1, 1, 1, 1, 5, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 
# Score the dev-0 split, then decode the predictions for manual inspection.
print(eval_model(test_dev0_tokens_ids, test_dev0_labels, lstm))

przewidywania_kody_test_dev0 = zwroc_przewidywania(test_dev0_tokens_ids)
przewidywania_etykiety_test_dev0 = zamien_przewidziane_kody_na_etykiety(przewidywania_kody_test_dev0)

# Show the first sequence of each representation together with its length:
# predicted codes, decoded labels, gold label tensor, gold codes.
for probka in (
    przewidywania_kody_test_dev0[0],
    przewidywania_etykiety_test_dev0[0],
    test_dev0_labels[0],
    kody_etykiet_dev0[0],
):
    print(probka)
    print(len(probka))

# Write one line per sequence; every label is followed by a single space.
with open("dev-0/out.tsv", "w", encoding="utf-8") as plik_wyjsciowy:
    for etykiety_dokumentu in przewidywania_etykiety_test_dev0:
        plik_wyjsciowy.write("".join(str(etykieta) + " " for etykieta in etykiety_dokumentu))
        plik_wyjsciowy.write("\n")
1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 0, 1, 0, 6, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 5, 8, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 5, 8, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 0, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 5, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 5, 1, 1, 0, 8, 1, 1, 1, 1, 1, 5, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 2, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 0, 1, 1, 1, 1, 1, 1, 1, 4, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 5, 1, 1, 1, 1, 5, 8, 1, 1, 3, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 5, 1, 0, 6, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 8, 1, 1, 1, 1, 1, 5, 1, 1, 1, 1, 1, 1, 1, 1, 1, 5, 1, 0, 6, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 5, 1, 5, 1, 1, 1, 7, 1, 5, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 5, 4, 1, 6, 1, 5, 8, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 0]\n", "['O', 'O', 'B-LOC', 'O', 'O', 'O', 'O', 'B-LOC', 'O', 'O', 'O', 'O', 'O', 'B-LOC', 'I-LOC', 'O', 'B-LOC', 'O', 'B-LOC', 'I-LOC', 'I-ORG', 'I-ORG', 'O', 'B-LOC', 'O', 'O', 'O', 'O', 'O', 'O', 'I-MISC', 'O', 'O', 'O', 'O', 'O', 'O', 'O', 'B-LOC', 'O', 'O', 'O', 'O', 'O', 'O', 'O', 'O', 'O', 'O', 'O', 'B-LOC', 'O', 'O', 'O', 'O', 'O', 'O', 'O', 'O', 'O', 'O', 'O', 'O', 'O', 'O', 'O', 'O', 'O', 'O', 'O', 'O', 'O', 'O', 'O', 'O', 'B-LOC', 'O', 'O', 'O', 'O', 'O', 'O', 'O', 'O', 'O', 'O', 'O', 'O', 'O', 'O', 'O', 'B-ORG', 'O', 'B-ORG', 'I-ORG', 'O', 'O', 'O', 'O', 'O', 'O', 'O', 'O', 'O', 'O', 'O', 'O', 'O', 'O', 'O', 'O', 'O', 'O', 'O', 'O', 'O', 'O', 'O', 'B-LOC', 'I-LOC', 'O', 'O', 'O', 'O', 'O', 'O', 'O', 'O', 'O', 'O', 'O', 'O', 'O', 'O', 'O', 'O', 'O', 'O', 'O', 'O', 'O', 'O', 'O', 'O', 'B-LOC', 'I-LOC', 'O', 'O', 'O', 'O', 'O', 'O', 'O', 'O', 'O', 'O', 'O', 'O', 'O', 'O', 'O', 'O', 'O', 
# Predict label codes for the test-A split and decode them to label names.
przewidywania_kody_test_A = zwroc_przewidywania(test_A_tokens_ids)
przewidywania_etykiety_test_A = zamien_przewidziane_kody_na_etykiety(przewidywania_kody_test_A)

# Show the first sequence as codes and as labels.
for probka in (przewidywania_kody_test_A[0], przewidywania_etykiety_test_A[0]):
    print(probka)

# Write one line per sequence; every label is followed by a single space.
with open("test-A/out.tsv", "w", encoding="utf-8") as plik_wyjsciowy:
    for etykiety_dokumentu in przewidywania_etykiety_test_A:
        plik_wyjsciowy.write("".join(str(etykieta) + " " for etykieta in etykiety_dokumentu))
        plik_wyjsciowy.write("\n")
1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 0, 1, 1, 1, 1, 5, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 5, 1, 1, 2, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 0]\n", "['B-LOC', 'I-ORG', 'B-MISC', 'O', 'O', 'O', 'B-MISC', 'O', 'O', 'O', 'B-LOC', 'I-LOC', 'O', 'B-LOC', 'O', 'O', 'O', 'B-MISC', 'I-ORG', 'O', 'O', 'O', 'O', 'O', 'O', 'B-MISC', 'O', 'O', 'O', 'O', 'O', 'B-MISC', 'O', 'O', 'O', 'O', 'O', 'O', 'O', 'O', 'O', 'O', 'O', 'O', 'O', 'O', 'O', 'B-LOC', 'O', 'O', 'O', 'O', 'B-MISC', 'I-ORG', 'O', 'B-ORG', 'O', 'O', 'O', 'O', 'O', 'O', 'O', 'O', 'O', 'O', 'O', 'O', 'O', 'O', 'B-LOC', 'O', 'O', 'O', 'O', 'O', 'O', 'O', 'O', 'O', 'O', 'O', 'O', 'O', 'O', 'O', 'O', 'O', 'O', 'O', 'O', 'O', 'O', 'O', 'O', 'O', 'O', 'O', 'O', 'O', 'O', 'O', 'O', 'O', 'I-PER', 'O', 'I-ORG', 'O', 'O', 'O', 'O', 'O', 'O', 'O', 'O', 'O', 'O', 'O', 'O', 'O', 'O', 'O', 'O', 'O', 'O', 'O', 'O', 'O', 'O', 'O', 'O', 'O', 'O', 'O', 'O', 'B-MISC', 'I-ORG', 'O', 'O', 'O', 'O', 'O', 'O', 'O', 'O', 'O', 'B-ORG', 'O', 'O', 'O', 'I-ORG', 'O', 'O', 'O', 'O', 'O', 'O', 'O', 'O', 'O', 'O', 'O', 'O', 'O', 'O', 'O', 'O', 'O', 'O', 'O', 'O', 'O', 'O', 'O', 'O', 'O', 'O', 'O', 'O', 'O', 'B-PER', 'O', 'O', 'O', 'O', 'O', 'O', 'B-LOC', 'O', 'B-LOC', 'O', 'O', 'O', 'O', 'O', 'O', 'O', 'O', 'O', 'O', 'O', 'B-LOC', 'O', 'O', 'O', 'O', 'O', 'O', 'O', 'O', 'B-PER', 'O', 'O', 'O', 'O', 'O', 'O', 'O', 'B-LOC', 'O', 'O', 'I-ORG', 'O', 'O', 'O', 'O', 'O', 'O', 'O', 'O', 'O', 'O', 'O', 'O', 'O', 'O', 'O', 'O', 'O', 'O', 'O', 'O', 'O', 'O', 'O', 'O', 'O', 'B-ORG', 'O', 'O', 'B-PER', 'I-PER', 'O', 'O', 'O', 'O', 'B-MISC', 'O', 'O', 'B-PER', 'O', 'O', 'O', 'O', 'O', 'O', 'O', 'O', 'O', 'O', 'O', 'O', 'O', 'O', 'O', 'O', 'O', 'O', 'B-LOC', 'O', 'B-LOC', 'O', 'B-PER', 'O', 'O', 'O', 'O', 'O', 'B-ORG', 'O', 'O', 'I-PER', 'O', 'O', 'I-PER', 'O', 'O', 'O', 'O', 'O', 'O', 'O', 'O', 'O', 'O', 'O', 'O', 'O', 'O', 'O', 'O', 'O', 'O', 'O', 'B-ORG', 'O', 'O', 'O', 'O', 'O', 'O', 'O', 'O', 'O', 'O', 'O', 'O', 'O', 'O', 'O', 'O', 'O', 'O', 'O', 'O', 'O', 
# Score the training split, then decode the predictions for manual inspection.
print(eval_model(train_tokens_ids, train_labels, lstm))

przewidywania_kody_test_train = zwroc_przewidywania(train_tokens_ids)
przewidywania_etykiety_test_train = zamien_przewidziane_kody_na_etykiety(przewidywania_kody_test_train)

# Show the first sequence as codes and as labels.
for probka in (przewidywania_kody_test_train[0], przewidywania_etykiety_test_train[0]):
    print(probka)

# Write one line per sequence; every label is followed by a single space.
with open("train/out.tsv", "w", encoding="utf-8") as plik_wyjsciowy:
    for etykiety_dokumentu in przewidywania_etykiety_test_train:
        plik_wyjsciowy.write("".join(str(etykieta) + " " for etykieta in etykiety_dokumentu))
        plik_wyjsciowy.write("\n")
"nbformat": 4, "nbformat_minor": 4 }