Automatically assigned DDC number: 005746
Manually assigned DDC number: 005436
Number of references: 8
Title: An Open Interface for Probabilistic Models of Text
Author:
Author:
Subject: John G. Cleary,W. J. Teahan An Open Interface for Probabilistic Models of Text
Description: An Application Program Interface (API) for modelling sequential text is described. The API is intended to shield the user from details of the modelling and probability estimation process. This should enable different implementations of models to be replaced transparently in application programs. The motivation for this API is work on the use of textual models for applications in addition to strict data compression, e.g. determination of the source of text, spelling correction or segmentation of text by inserting spaces. The API is probabilistic: that is, it supplies the probability of the next symbol in the sequence. It is general enough to deal accurately with models that include escapes for probabilities. The concepts abstracted by the API are explained together with details of the API calls.
Contributor: The Pennsylvania State University CiteSeer Archives
Publisher: unknown
Date: 1999-02-26
Pubyear: 1999
Format: ps
Identifier: http://citeseer.ist.psu.edu/152415.html
Source: http://www.cs.waikato.ac.nz/~wjt/papers/DCC99b.ps.gz
Language: en
Relation:
Relation:
Relation:
Relation:
Relation:
Relation:
Relation:
Relation:
Rights: unrestricted
<?xml version="1.0" encoding="UTF-8"?>
<references_metadata>
<rec ID="/176301.html" Type="techreport" CiteSeer_Book="" CiteSeer_Volume="" Title="On-Line Stochastic Processes in Data Compression,">
<identifier Org="ISBN:0792376684" Paper_ID="/176301.html" Extracted="0792376684" DDC="005.74/6" Normalized_DDC="005746" Normalized_Weight="0.5" />
<identifier Org="ISBN:1558605703" Paper_ID="/176301.html" Extracted="1558605703" DDC="651.5/0285574" Normalized_DDC="65150285574" Normalized_Weight="0.5" />
</rec>
<rec ID="/424258.html" Type="article" CiteSeer_Book="The Computer Journal" CiteSeer_Volume="40" Title="Semantically Motivated Improvements for {PPM} Variants,">
<identifier Org="ISBN:0387789081" Paper_ID="/424258.html" Extracted="0387789081" DDC="005.746" Normalized_DDC="005746" Normalized_Weight="0.5" />
<identifier Org="ISBN:0792376684" Paper_ID="/424258.html" Extracted="0792376684" DDC="005.74/6" Normalized_DDC="005746" Normalized_Weight="0.5" />
</rec>
<rec ID="/76182.html" Type="techreport" CiteSeer_Book="" CiteSeer_Volume="" Title="A block-sorting lossless data compression algorithm.,">
<identifier Org="ISBN:0126208611" Paper_ID="/76182.html" Extracted="0126208611" DDC="006.7/6" Normalized_DDC="00676" Normalized_Weight="0.0625" />
<identifier Org="ISBN:0387301623" Paper_ID="/76182.html" Extracted="0387301623" DDC="518.103" Normalized_DDC="518103" Normalized_Weight="0.0625" />
<identifier Org="ISBN:0471460540" Paper_ID="/76182.html" Extracted="0471460540" DDC="006.3" Normalized_DDC="0063" Normalized_Weight="0.0625" />
<identifier Org="ISBN:0471484229" Paper_ID="/76182.html" Extracted="0471484229" DDC="006.6" Normalized_DDC="0066" Normalized_Weight="0.0625" />
<identifier Org="ISBN:0780339576" Paper_ID="/76182.html" Extracted="0780339576" />
<identifier Org="ISBN:0780358589" Paper_ID="/76182.html" Extracted="0780358589" />
<identifier Org="ISBN:0821836269" Paper_ID="/76182.html" Extracted="0821836269" DDC="003/.54" Normalized_DDC="00354" Normalized_Weight="0.0625" />
<identifier Org="ISBN:0849335566" Paper_ID="/76182.html" Extracted="0849335566" DDC="005.74/6" Normalized_DDC="005746" Normalized_Weight="0.0625" />
<identifier Org="ISBN:0898713552" Paper_ID="/76182.html" Extracted="0898713552" DDC="519.4/0285/51" Normalized_DDC="5194028551" Normalized_Weight="0.0625" />
<identifier Org="ISBN:1846286026" Paper_ID="/76182.html" Extracted="1846286026" DDC="005.746" Normalized_DDC="005746" Normalized_Weight="0.0625" />
<identifier Org="ISBN:1848000715" Paper_ID="/76182.html" Extracted="1848000715" DDC="005.746" Normalized_DDC="005746" Normalized_Weight="0.0625" />
<identifier Org="ISBN:3540234780" Paper_ID="/76182.html" Extracted="3540234780" DDC="004" Normalized_DDC="004" Normalized_Weight="0.0625" />
<identifier Org="ISBN:3540290699" Paper_ID="/76182.html" Extracted="3540290699" DDC="621.36/7" Normalized_DDC="621367" Normalized_Weight="0.0625" />
<identifier Org="ISBN:3540653856" Paper_ID="/76182.html" Extracted="3540653856" DDC="004.015118" Normalized_DDC="004015118" Normalized_Weight="0.0625" />
<identifier Org="ISBN:3540664084" Paper_ID="/76182.html" Extracted="3540664084" DDC="001.64" Normalized_DDC="00164" Normalized_Weight="0.0625" />
<identifier Org="ISBN:3540708804" Paper_ID="/76182.html" Extracted="3540708804" />
<identifier Org="ISBN:3540714944" Paper_ID="/76182.html" Extracted="3540714944" DDC="025.04" Normalized_DDC="02504" Normalized_Weight="0.0625" />
<identifier Org="ISBN:3540734368" Paper_ID="/76182.html" Extracted="3540734368" DDC="518" Normalized_DDC="518" Normalized_Weight="0.0625" />
<identifier Org="ISBN:9812565000" Paper_ID="/76182.html" Extracted="9812565000" DDC="621.382/2" Normalized_DDC="6213822" Normalized_Weight="0.0625" />
</rec>
<rec ID="/581790.html" Type="article" CiteSeer_Book="IEEE Transactions on Communications" CiteSeer_Volume="COM32" Title="Data compression using adaptive coding and partial string matching,">
<identifier Org="ISBN:0120121638" Paper_ID="/581790.html" Extracted="0120121638" />
<identifier Org="ISBN:0126208611" Paper_ID="/581790.html" Extracted="0126208611" DDC="006.7/6" Normalized_DDC="00676" Normalized_Weight="0.08333333333333333" />
<identifier Org="ISBN:0387301623" Paper_ID="/581790.html" Extracted="0387301623" />
<identifier Org="ISBN:0387952608" Paper_ID="/581790.html" Extracted="0387952608" DDC="005.74/6" Normalized_DDC="005746" Normalized_Weight="0.08333333333333333" />
<identifier Org="ISBN:0471460540" Paper_ID="/581790.html" Extracted="0471460540" DDC="006.3" Normalized_DDC="0063" Normalized_Weight="0.08333333333333333" />
<identifier Org="ISBN:0471484229" Paper_ID="/581790.html" Extracted="0471484229" DDC="006.6" Normalized_DDC="0066" Normalized_Weight="0.08333333333333333" />
<identifier Org="ISBN:0792390857" Paper_ID="/581790.html" Extracted="0792390857" DDC="005.74/6" Normalized_DDC="005746" Normalized_Weight="0.08333333333333333" />
<identifier Org="ISBN:0849314909" Paper_ID="/581790.html" Extracted="0849314909" DDC="004" Normalized_DDC="004" Normalized_Weight="0.08333333333333333" />
<identifier Org="ISBN:089871611X" Paper_ID="/581790.html" Extracted="089871611X" DDC="005.74" Normalized_DDC="00574" Normalized_Weight="0.08333333333333333" />
<identifier Org="ISBN:1584884657" Paper_ID="/581790.html" Extracted="1584884657" DDC="621.384" Normalized_DDC="621384" Normalized_Weight="0.08333333333333333" />
<identifier Org="ISBN:3540001700" Paper_ID="/581790.html" Extracted="3540001700" DDC="005.1" Normalized_DDC="0051" Normalized_Weight="0.08333333333333333" />
<identifier Org="ISBN:3540263209" Paper_ID="/581790.html" Extracted="3540263209" DDC="006.3/7" Normalized_DDC="00637" Normalized_Weight="0.08333333333333333" />
<identifier Org="ISBN:354066887X" Paper_ID="/581790.html" Extracted="354066887X" DDC="003/.54" Normalized_DDC="00354" Normalized_Weight="0.08333333333333333" />
<identifier Org="ISBN:3540755292" Paper_ID="/581790.html" Extracted="3540755292" DDC="005.52" Normalized_DDC="00552" Normalized_Weight="0.08333333333333333" />
</rec>
<rec ID="/7158.html" Type="article" CiteSeer_Book="The Computer Journal" CiteSeer_Volume="40" Title="Unbounded Length Contexts for {PPM},">
<identifier Org="ISBN:0120121638" Paper_ID="/7158.html" Extracted="0120121638" />
<identifier Org="ISBN:0123744261" Paper_ID="/7158.html" Extracted="0123744261" DDC="004.05" Normalized_DDC="00405" Normalized_Weight="0.09090909090909091" />
<identifier Org="ISBN:0126208611" Paper_ID="/7158.html" Extracted="0126208611" DDC="006.7/6" Normalized_DDC="00676" Normalized_Weight="0.09090909090909091" />
<identifier Org="ISBN:0769523153" Paper_ID="/7158.html" Extracted="0769523153" DDC="006.7" Normalized_DDC="0067" Normalized_Weight="0.09090909090909091" />
<identifier Org="ISBN:0780385608" Paper_ID="/7158.html" Extracted="0780385608" DDC="621.382" Normalized_DDC="621382" Normalized_Weight="0.09090909090909091" />
<identifier Org="ISBN:0818681322" Paper_ID="/7158.html" Extracted="0818681322" DDC="003/.54" Normalized_DDC="00354" Normalized_Weight="0.09090909090909091" />
<identifier Org="ISBN:1402072317" Paper_ID="/7158.html" Extracted="1402072317" />
<identifier Org="ISBN:1595933395" Paper_ID="/7158.html" Extracted="1595933395" DDC="005.74" Normalized_DDC="00574" Normalized_Weight="0.09090909090909091" />
<identifier Org="ISBN:1605660949" Paper_ID="/7158.html" Extracted="1605660949" DDC="621.382" Normalized_DDC="621382" Normalized_Weight="0.09090909090909091" />
<identifier Org="ISBN:3540401970" Paper_ID="/7158.html" Extracted="3540401970" DDC="004" Normalized_DDC="004" Normalized_Weight="0.09090909090909091" />
<identifier Org="ISBN:3540403116" Paper_ID="/7158.html" Extracted="3540403116" DDC="006.4015116" Normalized_DDC="0064015116" Normalized_Weight="0.09090909090909091" />
<identifier Org="ISBN:3540625925" Paper_ID="/7158.html" Extracted="3540625925" DDC="511.3" Normalized_DDC="5113" Normalized_Weight="0.09090909090909091" />
<identifier Org="ISBN:3540664084" Paper_ID="/7158.html" Extracted="3540664084" DDC="001.64" Normalized_DDC="00164" Normalized_Weight="0.09090909090909091" />
<identifier Org="ISBN:3540732802" Paper_ID="/7158.html" Extracted="3540732802" />
</rec>
<rec ID="/9675.html" Type="misc" CiteSeer_Book="" CiteSeer_Volume="" Title="Modelling English Text,">
<identifier Org="ISBN:0769523153" Paper_ID="/9675.html" Extracted="0769523153" DDC="006.7" Normalized_DDC="0067" Normalized_Weight="0.1111111111111111" />
<identifier Org="ISBN:0792376684" Paper_ID="/9675.html" Extracted="0792376684" DDC="005.74/6" Normalized_DDC="005746" Normalized_Weight="0.1111111111111111" />
<identifier Org="ISBN:1402012160" Paper_ID="/9675.html" Extracted="1402012160" DDC="025.04" Normalized_DDC="02504" Normalized_Weight="0.1111111111111111" />
<identifier Org="ISBN:1558605703" Paper_ID="/9675.html" Extracted="1558605703" DDC="651.5/0285574" Normalized_DDC="65150285574" Normalized_Weight="0.1111111111111111" />
<identifier Org="ISBN:1558607900" Paper_ID="/9675.html" Extracted="1558607900" DDC="025.00285" Normalized_DDC="02500285" Normalized_Weight="0.1111111111111111" />
<identifier Org="ISBN:3540204091" Paper_ID="/9675.html" Extracted="3540204091" DDC="004" Normalized_DDC="004" Normalized_Weight="0.1111111111111111" />
<identifier Org="ISBN:3540234780" Paper_ID="/9675.html" Extracted="3540234780" DDC="004" Normalized_DDC="004" Normalized_Weight="0.1111111111111111" />
<identifier Org="ISBN:3540252959" Paper_ID="/9675.html" Extracted="3540252959" DDC="025.04" Normalized_DDC="02504" Normalized_Weight="0.1111111111111111" />
<identifier Org="ISBN:3540294147" Paper_ID="/9675.html" Extracted="3540294147" DDC="004" Normalized_DDC="004" Normalized_Weight="0.1111111111111111" />
</rec>
<rec ID="/10230.html" Type="inproceedings" CiteSeer_Book="Designs Codes and Cryptography" CiteSeer_Volume="" Title="Models of English Text,">
<identifier Org="ISBN:0780399277" Paper_ID="/10230.html" Extracted="0780399277" />
<identifier Org="ISBN:0792376684" Paper_ID="/10230.html" Extracted="0792376684" DDC="005.74/6" Normalized_DDC="005746" Normalized_Weight="1.0" />
</rec>
<rec ID="/33736.html" Type="inproceedings" CiteSeer_Book="Data Compression Conference" CiteSeer_Volume="" Title="Correcting English Text Using {PPM} Models,">
<identifier Org="ISBN:0780399277" Paper_ID="/33736.html" Extracted="0780399277" />
<identifier Org="ISBN:1869402790" Paper_ID="/33736.html" Extracted="1869402790" DDC="079/.94/08999442" Normalized_DDC="0799408999442" Normalized_Weight="1.0" />
</rec>
<rec ID="SELF" Type="SELF" CiteSeer_Book="SELF" CiteSeer_Volume="SELF" Title="An Open Interface for Probabilistic Models of Text" />
</references_metadata>