Automatically assigned DDC number: 005746
Manually assigned DDC number: 005746
Number of references: 4
Title: Symbol Ranking Text Compression
Author:
Subject: Peter Fenwick Symbol Ranking Text Compression
Description: In his work on the information content of English text in 1951, Shannon described a method of recoding the input text, a technique which has apparently lain dormant for the ensuing 45 years. Whereas traditional compressors exploit symbol frequencies and symbol contexts, Shannon's method adds the concept of "symbol ranking", as in 'the next symbol is the one 3rd most likely in the present context'. This report describes an implementation of his method and shows that it forms the basis of a good text compressor [1]. The recent "acb" compressor of Buynovsky is shown to belong to the general class of symbol ranking compressors. Keywords: text compression, Shannon, symbol ranking. [1] This report has been submitted as a paper to the Journal of Universal Computer Science. It is available by anonymous ftp from ftp.cs.auckland.ac.nz /out/peter-f/TechRep132. 1. Introduction. In 1951 C.E. Shannon published his classic paper on the information content of English text, establishing the well-known bo...
Contributor: The Pennsylvania State University CiteSeer Archives
Publisher: unknown
Date: 1996-09-13
Pubyear: 1996
Format: ps
Identifier: http://citeseer.ist.psu.edu/148490.html
Source: http://www.cs.aukuni.ac.nz/~techrep/TR132/doc.ps.Z
Language: en
Relation:
Relation:
Relation:
Relation:
Rights: unrestricted
<?xml version="1.0" encoding="UTF-8"?>
<references_metadata>
<rec ID="/76182.html" Type="techreport" CiteSeer_Book="" CiteSeer_Volume="" Title="A block-sorting lossless data compression algorithm.,">
<identifier Org="ISBN:0120121638" Paper_ID="/76182.html" Extracted="0120121638" />
<identifier Org="ISBN:0126208611" Paper_ID="/76182.html" Extracted="0126208611" DDC="006.7/6" Normalized_DDC="00676" Normalized_Weight="0.07692307692307693" />
<identifier Org="ISBN:0387301623" Paper_ID="/76182.html" Extracted="0387301623" DDC="518.103" Normalized_DDC="518103" Normalized_Weight="0.07692307692307693" />
<identifier Org="ISBN:0471460540" Paper_ID="/76182.html" Extracted="0471460540" DDC="006.3" Normalized_DDC="0063" Normalized_Weight="0.07692307692307693" />
<identifier Org="ISBN:0471484229" Paper_ID="/76182.html" Extracted="0471484229" DDC="006.6" Normalized_DDC="0066" Normalized_Weight="0.07692307692307693" />
<identifier Org="ISBN:0769512062" Paper_ID="/76182.html" Extracted="0769512062" />
<identifier Org="ISBN:0780339576" Paper_ID="/76182.html" Extracted="0780339576" />
<identifier Org="ISBN:0780358589" Paper_ID="/76182.html" Extracted="0780358589" />
<identifier Org="ISBN:0821836269" Paper_ID="/76182.html" Extracted="0821836269" DDC="003/.54" Normalized_DDC="00354" Normalized_Weight="0.07692307692307693" />
<identifier Org="ISBN:0849335566" Paper_ID="/76182.html" Extracted="0849335566" DDC="005.74/6" Normalized_DDC="005746" Normalized_Weight="0.07692307692307693" />
<identifier Org="ISBN:1846286026" Paper_ID="/76182.html" Extracted="1846286026" DDC="005.746" Normalized_DDC="005746" Normalized_Weight="0.07692307692307693" />
<identifier Org="ISBN:1848000715" Paper_ID="/76182.html" Extracted="1848000715" DDC="005.746" Normalized_DDC="005746" Normalized_Weight="0.07692307692307693" />
<identifier Org="ISBN:3540290699" Paper_ID="/76182.html" Extracted="3540290699" DDC="621.36/7" Normalized_DDC="621367" Normalized_Weight="0.07692307692307693" />
<identifier Org="ISBN:3540653856" Paper_ID="/76182.html" Extracted="3540653856" DDC="004.015118" Normalized_DDC="004015118" Normalized_Weight="0.07692307692307693" />
<identifier Org="ISBN:3540664084" Paper_ID="/76182.html" Extracted="3540664084" DDC="001.64" Normalized_DDC="00164" Normalized_Weight="0.07692307692307693" />
<identifier Org="ISBN:3540708804" Paper_ID="/76182.html" Extracted="3540708804" />
<identifier Org="ISBN:3540734368" Paper_ID="/76182.html" Extracted="3540734368" DDC="518" Normalized_DDC="518" Normalized_Weight="0.07692307692307693" />
<identifier Org="ISBN:9812565000" Paper_ID="/76182.html" Extracted="9812565000" DDC="621.382/2" Normalized_DDC="6213822" Normalized_Weight="0.07692307692307693" />
</rec>
<rec ID="/57744.html" Type="misc" CiteSeer_Book="" CiteSeer_Volume="" Title="Experiments with a Block Sorting Text Compression Algorithm,">
<identifier Org="ISBN:0126208611" Paper_ID="/57744.html" Extracted="0126208611" DDC="006.7/6" Normalized_DDC="00676" Normalized_Weight="0.5" />
<identifier Org="ISBN:0387789081" Paper_ID="/57744.html" Extracted="0387789081" DDC="005.746" Normalized_DDC="005746" Normalized_Weight="0.5" />
</rec>
<rec ID="/18506.html" Type="article" CiteSeer_Book="JUCS Journal of Universal Computer Science" CiteSeer_Volume="1" Title="Differential {Ziv-Lempel} Text Compression,">
<identifier Org="ISBN:0126208611" Paper_ID="/18506.html" Extracted="0126208611" DDC="006.7/6" Normalized_DDC="00676" Normalized_Weight="0.5" />
<identifier Org="ISBN:0387789081" Paper_ID="/18506.html" Extracted="0387789081" DDC="005.746" Normalized_DDC="005746" Normalized_Weight="0.5" />
</rec>
<rec ID="/132768.html" Type="misc" CiteSeer_Book="" CiteSeer_Volume="" Title="Block-Sorting Text Compression --- Final Report,">
<identifier Org="ISBN:0126208611" Paper_ID="/132768.html" Extracted="0126208611" DDC="006.7/6" Normalized_DDC="00676" Normalized_Weight="0.25" />
<identifier Org="ISBN:0387789081" Paper_ID="/132768.html" Extracted="0387789081" DDC="005.746" Normalized_DDC="005746" Normalized_Weight="0.25" />
<identifier Org="ISBN:3540291180" Paper_ID="/132768.html" Extracted="3540291180" DDC="005.1" Normalized_DDC="0051" Normalized_Weight="0.25" />
<identifier Org="ISBN:3540664084" Paper_ID="/132768.html" Extracted="3540664084" DDC="001.64" Normalized_DDC="00164" Normalized_Weight="0.25" />
</rec>
<rec ID="SELF" Type="SELF" CiteSeer_Book="SELF" CiteSeer_Volume="SELF" Title="Symbol Ranking Text Compression">
<identifier Org="ISBN:0126208611" Paper_ID="SELF" Extracted="0126208611" DDC="006.7/6" Normalized_DDC="00676" Normalized_Weight="0.125" />
<identifier Org="ISBN:0387789081" Paper_ID="SELF" Extracted="0387789081" DDC="005.746" Normalized_DDC="005746" Normalized_Weight="0.125" />
<identifier Org="ISBN:0792376684" Paper_ID="SELF" Extracted="0792376684" DDC="005.74/6" Normalized_DDC="005746" Normalized_Weight="0.125" />
<identifier Org="ISBN:1846286026" Paper_ID="SELF" Extracted="1846286026" DDC="005.746" Normalized_DDC="005746" Normalized_Weight="0.125" />
<identifier Org="ISBN:1848000715" Paper_ID="SELF" Extracted="1848000715" DDC="005.746" Normalized_DDC="005746" Normalized_Weight="0.125" />
<identifier Org="ISBN:354043075X" Paper_ID="SELF" Extracted="354043075X" DDC="005.1" Normalized_DDC="0051" Normalized_Weight="0.125" />
<identifier Org="ISBN:3540662782" Paper_ID="SELF" Extracted="3540662782" DDC="006.4015116" Normalized_DDC="0064015116" Normalized_Weight="0.125" />
<identifier Org="ISBN:3540664084" Paper_ID="SELF" Extracted="3540664084" DDC="001.64" Normalized_DDC="00164" Normalized_Weight="0.125" />
</rec>
</references_metadata>