%!PS-Adobe-3.0
%%Creator: groff version 1.09
%%CreationDate: Mon Mar 20 11:24:29 1995
%%DocumentNeededResources: font Times-Bold
%%+ font Times-Italic
%%+ font Times-Roman
%%+ font Courier
%%DocumentSuppliedResources: procset grops 1.09 0
%%Pages: 21
%%PageOrder: Ascend
%%Orientation: Portrait
%%EndComments
%%BeginProlog
%%BeginResource: procset grops 1.09 0
/setpacking where{
pop
currentpacking
true setpacking
}if
/grops 120 dict dup begin
/SC 32 def
/A/show load def
/B{0 SC 3 -1 roll widthshow}bind def
/C{0 exch ashow}bind def
/D{0 exch 0 SC 5 2 roll awidthshow}bind def
/E{0 rmoveto show}bind def
/F{0 rmoveto 0 SC 3 -1 roll widthshow}bind def
/G{0 rmoveto 0 exch ashow}bind def
/H{0 rmoveto 0 exch 0 SC 5 2 roll awidthshow}bind def
/I{0 exch rmoveto show}bind def
/J{0 exch rmoveto 0 SC 3 -1 roll widthshow}bind def
/K{0 exch rmoveto 0 exch ashow}bind def
/L{0 exch rmoveto 0 exch 0 SC 5 2 roll awidthshow}bind def
/M{rmoveto show}bind def
/N{rmoveto 0 SC 3 -1 roll widthshow}bind def
/O{rmoveto 0 exch ashow}bind def
/P{rmoveto 0 exch 0 SC 5 2 roll awidthshow}bind def
/Q{moveto show}bind def
/R{moveto 0 SC 3 -1 roll widthshow}bind def
/S{moveto 0 exch ashow}bind def
/T{moveto 0 exch 0 SC 5 2 roll awidthshow}bind def
/SF{
findfont exch
[exch dup 0 exch 0 exch neg 0 0]makefont
dup setfont
[exch/setfont cvx]cvx bind def
}bind def
/MF{
findfont
[5 2 roll
0 3 1 roll
neg 0 0]makefont
dup setfont
[exch/setfont cvx]cvx bind def
}bind def
/level0 0 def
/RES 0 def
/PL 0 def
/LS 0 def
/PLG{
gsave newpath clippath pathbbox grestore
exch pop add exch pop
}bind def
/BP{
/level0 save def
1 setlinecap
1 setlinejoin
72 RES div dup scale
LS{
90 rotate
}{
0 PL translate
}ifelse
1 -1 scale
}bind def
/EP{
level0 restore
showpage
}bind def
/DA{
newpath arcn stroke
}bind def
/SN{
transform
.25 sub exch .25 sub exch
round .25 add exch round .25 add exch
itransform
}bind def
/DL{
SN
moveto
SN
lineto stroke
}bind def
/DC{
newpath 0 360 arc closepath
}bind def
/TM matrix def
/DE{
TM currentmatrix pop
translate scale newpath 0 0 .5 0 360 arc closepath
TM setmatrix
}bind def
/RC/rcurveto load def
/RL/rlineto load def
/ST/stroke load def
/MT/moveto load def
/CL/closepath load def
/FL{
currentgray exch setgray fill setgray
}bind def
/BL/fill load def
/LW/setlinewidth load def
/RE{
findfont
dup maxlength 1 index/FontName known not{1 add}if dict begin
{
1 index/FID ne{def}{ pop pop}ifelse
}forall
/Encoding exch def
dup/FontName exch def
currentdict end definefont pop
}bind def
/DEFS 0 def
/EBEGIN{
moveto
DEFS begin
}bind def
/EEND/end load def
/CNT 0 def
/level1 0 def
/PBEGIN{
/level1 save def
translate
div 3 1 roll div exch scale
neg exch neg exch translate
0 setgray
0 setlinecap
1 setlinewidth
0 setlinejoin
10 setmiterlimit
[] 0 setdash
/setstrokeadjust where{
pop
false setstrokeadjust
}if
/setoverprint where{
pop
false setoverprint
}if
newpath
/CNT countdictstack def
userdict begin
/showpage{} def
}bind def
/PEND{
clear
countdictstack CNT sub{end}repeat
level1 restore
}bind def
end def
/setpacking where{
pop
setpacking
}if
%%EndResource
%%IncludeResource: font Times-Bold
%%IncludeResource: font Times-Italic
%%IncludeResource: font Times-Roman
%%IncludeResource: font Courier
grops begin/DEFS 1 dict def DEFS begin/u{.001 mul}bind def end/RES 72
def/PL 792 def/LS false def/ENC0[/asciicircum/asciitilde/Scaron/Zcaron
/scaron/zcaron/Ydieresis/trademark/quotesingle/.notdef/.notdef/.notdef
/.notdef/.notdef/.notdef/.notdef/.notdef/.notdef/.notdef/.notdef/.notdef
/.notdef/.notdef/.notdef/.notdef/.notdef/.notdef/.notdef/.notdef/.notdef
/.notdef/.notdef/space/exclam/quotedbl/numbersign/dollar/percent
/ampersand/quoteright/parenleft/parenright/asterisk/plus/comma/hyphen
/period/slash/zero/one/two/three/four/five/six/seven/eight/nine/colon
/semicolon/less/equal/greater/question/at/A/B/C/D/E/F/G/H/I/J/K/L/M/N/O
/P/Q/R/S/T/U/V/W/X/Y/Z/bracketleft/backslash/bracketright/circumflex
/underscore/quoteleft/a/b/c/d/e/f/g/h/i/j/k/l/m/n/o/p/q/r/s/t/u/v/w/x/y
/z/braceleft/bar/braceright/tilde/.notdef/quotesinglbase/guillemotleft
/guillemotright/bullet/florin/fraction/perthousand/dagger/daggerdbl
/endash/emdash/ff/fi/fl/ffi/ffl/dotlessi/dotlessj/grave/hungarumlaut
/dotaccent/breve/caron/ring/ogonek/quotedblleft/quotedblright/oe/lslash
/quotedblbase/OE/Lslash/.notdef/exclamdown/cent/sterling/currency/yen
/brokenbar/section/dieresis/copyright/ordfeminine/guilsinglleft
/logicalnot/minus/registered/macron/degree/plusminus/twosuperior
/threesuperior/acute/mu/paragraph/periodcentered/cedilla/onesuperior
/ordmasculine/guilsinglright/onequarter/onehalf/threequarters
/questiondown/Agrave/Aacute/Acircumflex/Atilde/Adieresis/Aring/AE
/Ccedilla/Egrave/Eacute/Ecircumflex/Edieresis/Igrave/Iacute/Icircumflex
/Idieresis/Eth/Ntilde/Ograve/Oacute/Ocircumflex/Otilde/Odieresis
/multiply/Oslash/Ugrave/Uacute/Ucircumflex/Udieresis/Yacute/Thorn
/germandbls/agrave/aacute/acircumflex/atilde/adieresis/aring/ae/ccedilla
/egrave/eacute/ecircumflex/edieresis/igrave/iacute/icircumflex/idieresis
/eth/ntilde/ograve/oacute/ocircumflex/otilde/odieresis/divide/oslash
/ugrave/uacute/ucircumflex/udieresis/yacute/thorn/ydieresis]def
/Courier@0 ENC0/Courier RE/Times-Roman@0 ENC0/Times-Roman RE
/Times-Italic@0 ENC0/Times-Italic RE/Times-Bold@0 ENC0/Times-Bold RE
%%EndProlog
%%Page: 0 1
%%BeginPageSetup
BP
%%EndPageSetup
/F0 12/Times-Bold@0 SF(Markup Reconsider)248.61 159 Q(ed)-.216 E/F1 10
/Times-Italic@0 SF(Darr)265.495 183 Q(ell R. Raymond)-.37 E -1.55 -.55
(Fr a)269.175 195 T(nk Wm. T).55 E(ompa)-.92 E/F2 10/Times-Roman@0 SF
(Department of Computer Science)238.93 213 Q(Uni)260.22 225 Q -.15(ve)
-.25 G(rsity of W).15 E(aterloo)-.8 E -.8(Wa)252.525 237 S
(terloo, Ontario, Canada).8 E(N2L 3G1)286.975 249 Q F1(Deric)280.04 273
Q 2.5(kW)-.2 G(ood)-3.42 E F2(Department of Computer Science)238.93 291
Q(Uni)245.64 303 Q -.15(ve)-.25 G(rsity of W).15 E(estern Ontario)-.8 E
(London, Ontario, Canada)255.175 315 Q(N6A 5B7)286.695 327 Q F1(ABSTRA)
282.535 375 Q(CT)-.3 E F2 1.796 -.8(We d)181 402.6 T .196
(escribe some of the implications of markup for document man-).8 F .88
(agement systems.)156 414.6 R(Markup')5.88 E 3.38(sp)-.55 G .88
(roperties are inherited from te)-3.38 F .88(xt, since it is)-.15 F
1.625(embedded in te)156 426.6 R 4.125(xt. These)-.15 F 1.626
(properties are most adv)4.125 F 1.626(antageous when docu-)-.25 F 2.811
(ment structure is reducible to substrings of characters, and when the)
156 438.6 R .231(update characteristics of the structure are similar to\
the update characteris-)156 450.6 R 1.027(tics of the te)156 462.6 R
3.527(xt. W)-.15 F 3.526(ed)-.8 G 1.026
(escribe situations in which these characteristics are)-3.526 F(disadv)
156 474.6 Q 3.035(antageous. Markup)-.25 F .535(is not a data model, b)
3.035 F .536(ut one of se)-.2 F -.15(ve)-.25 G .536(ral possible).15 F
.699(techniques for representing structure.)156 486.6 R -.15(Fo)5.699 G
3.199(rt).15 G .699(his reason it should not be the)-3.199 F
(foundation of document management systems.)156 498.6 Q(20 March 1995)
126 546.6 Q .32 LW 198 626.2 126 626.2 DL/F3 8/Times-Roman@0 SF .111
(This paper w)126 638 R .11(as presented at the First International W)
-.08 F .11(orkshop on Principles of Document Pro-)-.64 F(cessing, W)126
648 Q(ashington DC, October 21-23, 1992.)-.64 E EP
%%Page: 1 2
%%BeginPageSetup
BP
%%EndPageSetup
/F0 12/Times-Bold@0 SF(Markup Reconsider)248.61 159 Q(ed)-.216 E/F1 10
/Times-Italic@0 SF(Darr)265.495 183 Q(ell R. Raymond)-.37 E -1.55 -.55
(Fr a)269.175 195 T(nk Wm. T).55 E(ompa)-.92 E/F2 10/Times-Roman@0 SF
(Department of Computer Science)238.93 213 Q(Uni)260.22 225 Q -.15(ve)
-.25 G(rsity of W).15 E(aterloo)-.8 E -.8(Wa)252.525 237 S
(terloo, Ontario, Canada).8 E(N2L 3G1)286.975 249 Q F1(Deric)280.04 273
Q 2.5(kW)-.2 G(ood)-3.42 E F2(Department of Computer Science)238.93 291
Q(Uni)245.64 303 Q -.15(ve)-.25 G(rsity of W).15 E(estern Ontario)-.8 E
(London, Ontario, Canada)255.175 315 Q(N6A 5B7)286.695 327 Q/F3 10
/Times-Bold@0 SF 2.5(1. Intr)126 363 R(oduction.)-.18 E F2 3.245(As)126
378.6 S .745(ound theory of document management systems requires a good\
understanding of the)-3.245 F .299(role of markup.)126 390.6 R .298
(Markup is the use of embedded codes, kno)5.298 F .298
(wn as tags, to describe a doc-)-.25 F(ument')126 402.6 Q 2.54(ss)-.55 G
.041(tructure, or to embed instructions that can be used by a layout pr\
ocessor or other)-2.54 F .787(document management tools.)126 414.6 R
.787(Markup is ubiquitous, b)5.787 F .787
(ut its properties as a form of data)-.2 F 1.131(representation ha)126
426.6 R 1.431 -.15(ve n)-.2 H 1.132
(ot been studied by the computer science community).15 F 6.132(.M)-.65 G
1.132(arkup has)-6.132 F(recei)126 438.6 Q -.15(ve)-.25 G 2.5(da).15 G
(ttention lar)-2.5 E(gely in the conte)-.18 E
(xt of document standards or implementations.)-.15 E .059(There are se)
126 454.2 R -.15(ve)-.25 G .059
(ral reasons to consider markup as an independent phenomenon.).15 F .058
(The \214rst is)5.058 F 2.268(that it is perv)126 466.2 R(asi)-.25 E
-.15(ve)-.25 G 4.769(;w).15 G(here)-4.769 E -.15(ve)-.25 G 4.769(rt).15
G -.15(ex)-4.769 G 4.769(ti).15 G 4.769(su)-4.769 G 2.269
(sed as a type of data, markup is lik)-4.769 F 2.269(ely to be)-.1 F
(emplo)126 478.2 Q 2.525(yed. This)-.1 F .024
(usage includes not only traditional online and of)2.525 F .024
(\215ine documents, b)-.25 F .024(ut also)-.2 F 1.541(programming-langu\
age source code, command languages, macro languages, te)126 490.2 R
(xt-based)-.15 E .953(protocols, and other sequential information.)126
502.2 R .952(The second reason to study markup is that)5.953 F .816(our\
current understanding of it is bound to the operations of markup proce\
ssors; that is,)126 514.2 R .809(we usually e)126 526.2 R .809
(xplain a tag')-.15 F 3.309(sf)-.55 G .808
(unction by describing the operation of the processor for that)-3.309 F
3.57(tag. W)126 538.2 R 3.57(ek)-.8 G(no)-3.57 E 3.57(wt)-.25 G 1.07(ha\
t in other areas of computer science, operational descriptions of phe-)
-3.57 F .212(nomena are not suf)126 550.2 R 2.712(\214cient[8]. As)-.25
F 2.712(ar)2.712 G .212(esult, man)-2.712 F 2.712(ye)-.15 G .211
(xisting document systems and standards)-2.862 F 1.3(are idiosyncratic \
and application-dependent, and do not appear to be founded on suf)126
562.2 R<8c2d>-.25 E 1.302(ciently general principles[18].)126 574.2 R
3.802(At)6.302 G 1.302
(hird reason is that a better understanding of markup)-3.802 F .544
(might help us to clarify e)126 586.2 R .544(xactly ho)-.15 F 3.044(wd)
-.25 G .544(ocument systems dif)-3.044 F .545
(fer from traditional databases.)-.25 F -1.25 -.7(Te x)126 598.2 T 2.641
(ta).7 G .141(ppears to be quite dif)-2.641 F .141
(ferent from numbers, and markup seems an unlik)-.25 F .14
(ely candidate)-.1 F 1.275(for structuring accounting databases, b)126
610.2 R 1.275(ut these are observ)-.2 F 1.275
(ations of established practice,)-.25 F 1.147
(not of theoretical limits.)126 622.2 R 1.147(If te)6.147 F 1.147
(xt is dif)-.15 F 1.147(ferent from traditional data, it w)-.25 F 1.146
(ould be useful to)-.1 F .32 LW 198 630.2 126 630.2 DL/F4 8
/Times-Roman@0 SF .111(This paper w)126 642 R .11
(as presented at the First International W)-.08 F .11
(orkshop on Principles of Document Pro-)-.64 F(cessing, W)126 652 Q
(ashington DC, October 21-23, 1992.)-.64 E EP
%%Page: 2 3
%%BeginPageSetup
BP
%%EndPageSetup
/F0 10/Times-Roman@0 SF(2)126 66 Q .56
(\214nd some fundamental reasons for that dif)126 120 R .56
(ference, and a better understanding of markup)-.25 F
(may help us to identify them.)126 132 Q .289(In what follo)126 147.6 R
.289(ws, we de)-.25 F -.15(ve)-.25 G .289
(lop some of the aspects of a theory of markup, independently of).15 F
.031(particular implementations or standards.)126 159.6 R 1.631 -.8
(We b)5.031 H -.15(eg).8 G .031(in by characterizing te).15 F(xt')-.15 E
2.531(sp)-.55 G .031(roperties as a)-2.531 F .762
(system of symbols. Since markup is embedded in te)126 171.6 R .762
(xt, it inherits man)-.15 F 3.262(yo)-.15 G 3.262(ft)-3.262 G -.15(ex)
-3.262 G(t').15 E 3.262(sp)-.55 G(roper)-3.262 E(-)-.2 E 3.723(ties. Ne)
126 183.6 R 1.223(xt we consider ho)-.15 F 3.723(ws)-.25 G 1.223
(ome of markup')-3.723 F 3.724(sp)-.55 G 1.224
(roblems are a result of these inherited)-3.724 F .219
(properties, and hence not easily a)126 195.6 R -.2(vo)-.2 G 2.718
(ided. Finally).2 F 2.718(,w)-.65 G 2.718(eb)-2.718 G .218(rie\215y e)
-2.718 F .218(xplore ho)-.15 F 2.718(wd)-.25 G .218(ocument man-)-2.718
F 1.196(agement systems dif)126 207.6 R 1.196
(fer from traditional databases, and consider ho)-.25 F 3.696(wm)-.25 G
1.196(arkup addresses)-3.696 F(these unique needs.)126 219.6 Q/F1 10
/Times-Bold@0 SF 2.5(2. What)126 243.6 R(is markup?)2.5 E F0 .908
(What we think of as te)126 259.2 R .908(xt is irretrie)-.15 F -.25(va)
-.25 G .907(bly bound to the processes used to create it and to).25 F
.822(access it.)126 271.2 R -1.11(Va)5.822 G .822
(rious types of markup ha)1.11 F 1.122 -.15(ve b)-.2 H .822(een in).15 F
-.15(ve)-.4 G .823(nted to support these processes.).15 F(His-)5.823 E
(torically)126 283.2 Q 3.392(,t)-.65 G .892
(he most important processor of documents has been the human reader)
-3.392 F 5.891(.T)-.55 G(hus,)-5.891 E .164
(the earliest types of markup were designed to f)126 295.2 R .164
(acilitate the reading process.)-.1 F .164(In consonan-)5.164 F .02
(tal scripts, for e)126 307.2 R .02(xample, diacritics were emplo)-.15 F
.02(yed to signify v)-.1 F .02(ocalic distinctions[9].)-.2 F(Punc-)5.02
E .295(tuation, w)126 319.2 R .295(ord di)-.1 F .295
(vision, and sentence di)-.25 F .295
(vision are a type of markup adopted to pro)-.25 F .295(vide the)-.15 F
.82(reader with clues about emphasis, or)126 331.2 R -.05(ga)-.18 G .82
(nization, and breathing.).05 F .82(These f)5.82 F .82(actors may seem)
-.1 F(secondary to the content of the te)126 343.2 Q(xt, b)-.15 E
(ut note that:)-.2 E 2.901(It probably also mak)151 358.8 R 2.901
(es a dif)-.1 F 2.901(ference whether in Jo)-.25 F(yce')-.1 E(s)-.55 E
/F2 10/Times-Italic@0 SF(Ulysses)5.401 E F0 2.901(one of)5.401 F 1.607
(Stephen Dedalus' \214rst thoughts is `No mother' \(as in printed v)151
370.8 R 1.607(ersions\) or)-.15 F
(`No, mother' \(as in the manuscript\)[32].)151 382.8 Q 2.055
(Punctuation symbols are in such common use that the)126 398.4 R 4.556
(ys)-.15 G 2.056(eem themselv)-4.556 F 2.056(es part of the)-.15 F .144
(alphabet, and so seem part of the content of the te)126 410.4 R 2.643
(xt. Another)-.15 F .143(early type of markup to aid)2.643 F .693(readi\
ng is illumination, the graphical embellishment of important characters\
in medie)126 422.4 R -.25(va)-.25 G(l).25 E 4.272
(manuscripts. Illumination)126 434.4 R(serv)4.272 E 1.772(es a decorati)
-.15 F 2.072 -.15(ve p)-.25 H 1.772(urpose, b).15 F 1.772
(ut it also identi\214es important)-.2 F .909(breaks in the te)126 446.4
R .909(xt, such as ne)-.15 F 3.409(wc)-.25 G .909(hapters and sections.)
-3.409 F -.15(Pa)5.909 G .91(ge furniture\212headers, footers,).15 F(an\
d page numbers\212is another type of markup that helps to orient the re\
ader)126 458.4 Q(.)-.55 E(Lik)126 474 Q 2.551(es)-.1 G .051
(peech, documents purport to describe the w)-2.551 F .051
(orld or tell a story)-.1 F 5.05(.U)-.65 G(nlik)-5.05 E 2.55(es)-.1 G
.05(peech, ho)-2.55 F(w-)-.25 E -2.15 -.25(ev e)126 486 T 1.225 -.4
(r, d).25 H .425(ocuments are considered objects in their o).4 F .426
(wn right, separate from the speak)-.25 F(er)-.1 E 2.926(,a)-.4 G(nd)
-2.926 E .25(so are often themselv)126 498 R .249
(es a subject for documentation[13].)-.15 F .249
(This property of documents led)5.249 F 1.073(to a second class of mark\
up, namely critical commentaries of the `main' content.)126 510 R(This)
6.074 E 2.698(class of markup includes mar)126 522 R 2.698
(ginalia, footnotes, and other e)-.18 F 2.697(xplanatory meta-content.)
-.15 F 2.375(Scholarly documents mak)126 534 R 4.875(ee)-.1 G(xtensi)
-5.025 E 2.675 -.15(ve u)-.25 H 2.375
(se of critical commentaries. Some editions of).15 F .619(ancient w)126
546 R .619(orks are so hea)-.1 F .619(vily mark)-.2 F .619
(ed up that the main content is only a small fraction of)-.1 F
(the total information.)126 558 Q .293(The adv)126 573.6 R .293(ent of \
book making and the consequent specialization of the writing, editing, \
and)-.15 F .901
(book-production crafts led to a third class of markup: editor')126
585.6 R 3.401(sa)-.55 G .9(nd printer')-3.401 F 3.4(sm)-.55 G .9
(arks. This)-3.4 F .42
(class of markup supports `out-of-band' communication between writer)126
597.6 R 2.92(,e)-.4 G(ditor)-2.92 E 2.92(,a)-.4 G .42(nd book-)-2.92 F
(mak)126 609.6 Q(er)-.1 E 2.686(,a)-.4 G .186
(nd can be thought of as a kind of critical commentary on the document')
-2.686 F 2.686(sp)-.55 G(roduc-)-2.686 E .938
(tion, to be read at the ne)126 621.6 R .939
(xt stage of the production process.)-.15 F .939
(Production markup is typi-)5.939 F 1.055(cally applied directly to man\
uscripts or proofs, usually with coloured pens and a set of)126 633.6 R
(symbols agreed upon by con)126 645.6 Q -.15(ve)-.4 G(ntion.).15 E EP
%%Page: 3 4
%%BeginPageSetup
BP
%%EndPageSetup
/F0 10/Times-Roman@0 SF(3)481 66 Q .534(The \214rst generation of onlin\
e typesetting systems adopted embedded markup to commu-)126 120 R 2.119
(nicate layout instructions from the human to the machine.)126 132 R
2.118(Since the primiti)7.118 F 2.418 -.15(ve i)-.25 H(nput).15 E(de)126
144 Q 1.001(vices of the time did not support colour or arbitrary glyph\
s, markup and content w)-.25 F(as)-.1 E .246(entered in the same input \
stream, using the same alphabet, and markup w)126 156 R .246
(as distinguished)-.1 F .885(by special pre\214x)126 168 R .885
(es and suf)-.15 F<8c78>-.25 E 3.385(es. Most)-.15 F .886
(computer typesetting systems still use embedded)3.385 F
(commands to control document production.)126 180 Q .342
(Currently markup')126 195.6 R 2.842(se)-.55 G -.2(vo)-3.092 G .342
(lution is dri).2 F -.15(ve)-.25 G 2.842(nb).15 G 2.842(yt)-2.842 G .542
-.1(wo b)-2.842 H .342(asic requirements.).1 F .341
(First, the requirement)5.342 F .08(for multiple presentations of a te)
126 207.6 R .08
(xt has resulted in markup becoming an indirect speci\214ca-)-.15 F .686
(tion of presentation.)126 219.6 R .685
(Rather than denoting speci\214c layout instructions for document ele-)
5.686 F .907(ments, markup of design elements identi\214es members of s\
peci\214c layout classes that are)126 231.6 R .069
(mapped to a speci\214c presentation through a style sheet.)126 243.6 R
.068(Markup of design elements \(such)5.068 F .472(as the)126 255.6 R/F1
10/Times-Italic@0 SF(-ms)2.972 E F0 .472(macros for)2.972 F F1(tr)2.972
E(of)-.45 E(f)-.18 E F0 .473(and L)2.973 F/F2 8/Times-Roman@0 SF(A)-2.24
-1.5 M F0(T)-1 1.5 M(E)-1.6 2 M 2.973(Xm)-1.5 -2 O .473(acros for T)
-2.973 F(E)-1.6 2 M .473(X\) f)-1.5 -2 N .473
(acilitate layout parameterization.)-.1 F 2.142(Second, the idea that d\
ocuments can be treated as databases has resulted in markup)126 267.6 R
.974(assuming a role as representation for data elements, f)126 279.6 R
.975(acilitating automatic querying and)-.1 F 2.5(updating. Markup)126
291.6 R(thus plays an important role in identifying structure.)2.5 E
3.204(In modern use, there are se)126 307.2 R -.15(ve)-.25 G 3.204
(ral recognized subcate).15 F 3.204(gories of markup.)-.15 F F1
(Descriptive)8.204 E F0 .083
(markup identi\214es a logical structure in a document[7].)126 319.2 R
(Descripti)5.083 E .384 -.15(ve m)-.25 H .084(arkup is usually dis-).15
F 1.375(tinguished from)126 331.2 R F1(pr)3.875 E(ocedur)-.45 E(al)-.15
E F0 1.375(markup, in which tags are mapped to actions of a speci\214c)
3.875 F(de)126 343.2 Q 2.599(vice. Markup)-.25 F .099(that is not restr\
icted to a single application, style, or formatting system is)2.599 F
(kno)126 355.2 Q .998(wn as)-.25 F F1 -.1(ge)3.498 G(ner).1 E(alized)
-.15 E F0 3.498(markup[10]. Generalized)3.498 F .998(and descripti)3.498
F 1.298 -.15(ve m)-.25 H .998(arkup are often tak).15 F(en)-.1 E 2.724
(to be synon)126 367.2 R 5.224(ymous. Recently)-.15 F 5.224(,m)-.65 G
2.724(arkup adv)-5.224 F 2.724(ocates ha)-.2 F 3.024 -.15(ve s)-.2 H
2.724(uggested a useful separation).15 F .125(between procedural and)126
379.2 R F1(declar)2.625 E(ative)-.15 E F0 .124
(markup, where the former describes an operation and)2.625 F .633
(the latter describes a constraint.)126 391.2 R(The)5.634 E 3.134(ya)
-.15 G .634(lso separate)-3.134 F F1(pr)3.134 E(esentational)-.37 E F0
(and)3.134 E F1(analytic)3.134 E F0(markup;)3.134 E .185(the former is \
markup that describes appearance, and the latter is markup that describ\
es an)126 403.2 R(ontology for the document.)126 415.2 Q 1.378
(What commonalities e)126 430.8 R 1.379
(xist between punctuation, critical commentaries, printer')-.15 F 3.879
(sm)-.55 G(arks,)-3.879 E .41(typesetting commands, and structural tags\
? The essential characteristic of all these forms)126 442.8 R .552
(of structure is that the)126 454.8 R 3.053(ya)-.15 G .553
(re simultaneously)-3.053 F F1(embedded)3.053 E F0(and)3.053 E F1(separ)
3.053 E(able)-.15 E F0 3.053(;t)C(he)-3.053 E 3.053(ya)-.15 G .553
(re part of the)-3.053 F(te)126 466.8 Q
(xt, yet distinguishable from it.)-.15 E .384
(Structure can be either strongly or weakly embedded.)126 482.4 R .383
(In either case, the structure is pre-)5.384 F .538
(sent in the data; the dif)126 494.4 R .538
(ference is that for strongly embedded structure, its position in the)
-.25 F .768(data is information bearing.)126 506.4 R .768(An e)5.768 F
.768(xample of strongly embedded tags is found in the fol-)-.15 F(lo)126
518.4 Q(wing te)-.25 E(xt:)-.15 E/F3 10/Courier@0 SF 2.286
(now is the time for all good men)151 546 R
(to come to the aid of the party)151 558 Q F0 .667
(These tags demarcate a speci\214c w)126 585.6 R .667(ord in the te)-.1
F .667(xt and assign that w)-.15 F .667(ord to a cate)-.1 F(gory)-.15 E
5.666(.A)-.65 G(n)-5.666 E -.15(ex)126 597.6 S
(ample of a weakly embedded tag is the follo).15 E(wing:)-.25 E F3 1.6
(now is the time for all good men to)151 625.2 R
(come to the aid of the party)151 637.2 Q EP
%%Page: 4 5
%%BeginPageSetup
BP
%%EndPageSetup
/F0 10/Times-Roman@0 SF(4)126 66 Q .356(The tag)126 120 R/F1 10
/Courier@0 SF .356()2.856 F F0 .356(is informati)2.856 F
-.15(ve)-.25 G 2.856(,b).15 G .356(ut its location within the te)-3.056
F .355(xt is not informa-)-.15 F .095(tion bearing; in this e)126 132 R
.095(xample, it could be placed at an)-.15 F 2.595(yp)-.15 G .095
(oint in the te)-2.595 F .095(xt, or e)-.15 F -.15(ve)-.25 G 2.595(no)
.15 G .095(utside it,)-2.595 F 1.153(without losing its meaning.)126 144
R 1.152(The test for strongly embedded markup is: Can the tag be)6.152 F
(mo)126 156 Q -.15(ve)-.15 G 3.29(dt).15 G 3.29(os)-3.29 G .79
(ome other position in the te)-3.29 F .79
(xt without loss of information?)-.15 F .79(If it cannot, then)5.79 F
(the tag is strongly embedded.)126 168 Q/F2 10/Times-Italic@0 SF 1.194
(In normal use)126 183.6 R 3.694(,`)-.1 G 1.194(markup' means str)-3.694
F 1.193(ongly embedded structur)-.45 F(e)-.37 E F0 3.693(,a)C 1.193
(nd the remainder of our)-3.693 F 2.288
(discussion focuses on the properties of this kind of markup.)126 195.6
R 2.289(De\214nitions are al)7.289 F -.1(wa)-.1 G(ys).1 E .45
(debatable, b)126 207.6 R .45
(ut we will treat this one as both necessary and suf)-.2 F .45
(\214cient; an)-.25 F .45(ything that is not)-.15 F .883(embedded and s\
eparable is not markup, and being embedded and separable is suf)126
219.6 R(\214cient)-.25 E 1.431(for something to be markup.)126 231.6 R
1.431(Note, therefore, that we do not require a structure to be)6.431 F
(descripti)126 243.6 Q -.15(ve)-.25 G 2.504(,o).15 G 2.504(rc)-2.504 G
(onte)-2.504 E .005(xt-free, or nested, or distinguishable by means of \
unique start and end)-.15 F .761(characters, in order to be markup.)126
255.6 R .761(These are all properties of speci\214c forms of markup,)
5.761 F(rather than characteristic of markup in general.)126 267.6 Q
3.372(Aw)126 283.2 S .873(ord should be said about so-called)-3.472 F F2
(out-of-line)3.373 E F0 .873(markup, non-embedded structure that)3.373 F
2.88(conforms to the syntactic requirements of a gi)126 295.2 R -.15(ve)
-.25 G 5.38(nm).15 G 2.88(arkup standard[2].)-5.38 F(Out-of-line)7.88 E
.207(markup is not markup by our de\214nition, b)126 307.2 R .207
(ut readers can choose the terminology the)-.2 F 2.708(yp)-.15 G(re-)
-2.708 E .758
(fer; we intend merely to distinguish between internal and e)126 319.2 R
.758(xternal structure.)-.15 F .758(While out-)5.758 F .297
(of-line markup does not suf)126 331.2 R .298
(fer from some of the disadv)-.25 F .298
(antages that we shall discuss, nei-)-.25 F 1.52
(ther does it share the adv)126 343.2 R 1.52
(antages of strongly embedded markup, and is more properly)-.25 F
(considered a speci\214c type of e)126 355.2 Q(xternal structure.)-.15 E
.262(In addition to describing what markup is, it is important to note \
what markup is not.)126 370.8 R .262(It is)5.262 F 1.034(not a computat\
ional automaton, a data model, or a mathematical formalism.)126 382.8 R
1.034(It is not a)6.034 F 1.113(computational automaton, because it doe\
s not by itself specify the input, the output, or)126 394.8 R .497
(the beha)126 406.8 R .497(viour of an)-.2 F 2.997(ya)-.15 G .497
(bstract de)-2.997 F 2.997(vice. It)-.25 F .496
(is not a data model, because it does not by itself)2.997 F 2.039(denot\
e classes of data, operations on those classes, or constraints on v)126
418.8 R 2.04(alid instances.)-.25 F(Finally)126 430.8 Q 2.509(,i)-.65 G
2.509(ti)-2.509 G 2.508(sn)-2.509 G .008(ot a mathematical formalism, b\
ecause it is not accompanied by a set of rules)-2.508 F 1.026
(that describes ho)126 442.8 R 3.526(wi)-.25 G 3.526(tc)-3.526 G 1.026
(an be manipulated.)-3.526 F 1.026
(Markup is, instead, simply the denotation of)6.026 F .864
(speci\214c positions in a te)126 454.8 R .864
(xt with some assigned tok)-.15 F 3.363(ens. It)-.1 F .863
(is fully dependent on e)3.363 F(xternal)-.15 E .163
(information for meaning.)126 466.8 R .164
(In most document management systems that emplo)5.163 F 2.664(ym)-.1 G
.164(arkup, a)-2.664 F 2.71(computational de)126 478.8 R 2.71
(vice \(usually a pushdo)-.25 F 2.71
(wn automaton\) is implemented as a w)-.25 F 2.71(ay of)-.1 F .852
(embedding a mathematical formalism \(usually a conte)126 490.8 R .853
(xt-free grammar\) in a system that)-.15 F 2.55(recognizes te)126 502.8
R 2.55(xts containing structure \(usually indicated by the presence of \
markup\).)-.15 F(Clearly)126 514.8 Q 3.227(,i)-.65 G 3.227(ti)-3.227 G
3.228(sp)-3.227 G .728(ossible to ha)-3.228 F 1.028 -.15(ve t)-.2 H .728
(he formalism \(and the implied data model\) without either).15 F 1.075
(the computational de)126 526.8 R 1.075(vice or the markup.)-.25 F 1.074
(Markup thus belongs not to the w)6.074 F 1.074(orld of for)-.1 F(-)-.2
E 1.325(malisms, b)126 538.8 R 1.325(ut to the w)-.2 F 1.325
(orld of representations; its properties of interest are those of an)-.1
F(y)-.15 E(data structure.)126 550.8 Q/F3 10/Times-Bold@0 SF 2.5(3. The)
126 574.8 R(pr)2.5 E(operties of text.)-.18 E F0(Markup')126 590.4 Q
3.123(sp)-.55 G .623(roperties are lar)-3.123 F .623(gely deri)-.18 F
-.25(va)-.25 G(ti).25 E .922 -.15(ve o)-.25 H 3.122(ft).15 G .622
(he properties of the documents in which it)-3.122 F .085(is embedded.)
126 602.4 R .085(Thus, it is w)5.085 F .086(orthwhile to re)-.1 F(vie)
-.25 E 2.586(ws)-.25 G .086(ome of the basic properties of documents.)
-2.586 F .005(In the follo)126 614.4 R .005(wing, we restrict ourselv)
-.25 F .005(es to the properties of te)-.15 F .004
(xt, particularly to te)-.15 F .004(xts as the)-.15 F(y)-.15 E .04
(are usually represented in computers.)126 626.4 R .041(It w)5.041 F
.041(ould be interesting to de)-.1 F -.15(ve)-.25 G .041
(lop a theory of docu-).15 F .095(ments that w)126 638.4 R .095
(ould include such things as paintings and gestures, b)-.1 F .094
(ut we will not attempt to)-.2 F(do so here.)126 650.4 Q EP
%%Page: 5 6
%%BeginPageSetup
BP
%%EndPageSetup
/F0 10/Times-Roman@0 SF(5)481 66 Q .141(The class of te)126 120 R .141
(xt is an important subclass of the general f)-.15 F .142
(amily of sign systems.)-.1 F -1.25 -.7(Te x)5.142 H .142(ts are).7 F
.677(constructed from atomic elements kno)126 132 R .677
(wn as characters.)-.25 F 3.177(As)5.677 G .676
(et of such characters consti-)-3.177 F .696(tutes an alphabet.)126 144
R .697(Alphabets partition the possible set of inscriptions; an inscrip\
tion can)5.696 F .657(belong to at most one character in an alphabet.)
126 156 R(Moreo)5.657 E -.15(ve)-.15 G 1.457 -.4(r, i).15 H 3.157(ti).4
G 3.157(st)-3.157 G .657(he case that the le)-3.157 F -.15(ve)-.25 G
3.157(lo).15 G(f)-3.157 E .184(discrimination needed to mak)126 168 R
2.684(es)-.1 G .185(uch distinctions is \214nite[11].)-2.684 F .185
(The number of equi)5.185 F -.25(va)-.25 G(lence).25 E .27
(classes de\214ned by an alphabet is al)126 180 R -.1(wa)-.1 G .269
(ys \214nite, b).1 F .269(ut can v)-.2 F .269(ary in size.)-.25 F .269
(The Roman alphabet)5.269 F(de\214nes 26 characters, whereas the Chines\
e alphabet de\214nes 50,000 or more.)126 192 Q(Indi)126 207.6 Q 1.283
(vidual characters by themselv)-.25 F 1.283(es are rarely suf)-.15 F
1.284(\214cient communications.)-.25 F 1.284(An essential)6.284 F .291(\
feature of a system of writing is that it supports the creation of comp\
ound e)126 219.6 R .29(xpressions by)-.15 F 2.171
(means of character combinations[12].)126 231.6 R 2.171(Most te)7.171 F
2.171(xts use relati)-.15 F 2.471 -.15(ve p)-.25 H 2.171
(ositioning to produce).15 F .307
(these combinations; characters are placed ne)126 243.6 R .307
(xt to one another)-.15 F 2.807(,a)-.4 G .307
(nd a collection of charac-)-2.807 F .316
(ters that share proximity is treated as a unit.)126 255.6 R .317
(Exceptions to this principle are situations in)5.317 F .196
(which multiple characters occup)126 267.6 R 2.696(yt)-.1 G .195
(he same position; for e)-2.696 F .195
(xample, the use of diacritics for)-.15 F(accenting, or the use of o)126
279.6 Q -.15(ve)-.15 G(rstrik).15 E
(es in arti\214cial languages such as APL.\207)-.1 E 1.002
(Symbol systems that emplo)126 295.2 R 3.502(yd)-.1 G 1.002
(iscrete characters and relati)-3.502 F 1.303 -.15(ve o)-.25 H 1.003
(rdering ha).15 F 1.303 -.15(ve a)-.2 H 3.503(tl).15 G 1.003(east four)
-3.503 F 1.62(classes of properties: resources, granularity)126 307.2 R
4.12(,o)-.65 G(rder)-4.12 E 4.12(,a)-.4 G 1.62(nd update.)-4.12 F 1.62
(These four classes are)6.62 F(some)126 319.2 Q .439
(what interdependent, b)-.25 F .439
(ut we present them separately for the purposes of e)-.2 F(xposition.)
-.15 E/F1 10/Times-Bold@0 SF(Resour)126 334.8 Q(ces)-.18 E F0 3.612(.T)C
1.112(he resources of a te)-3.612 F 1.111(xt are the ra)-.15 F 3.611(wm)
-.15 G 1.111(aterials of which it is constructed: its)-3.611 F 1.095
(symbol set and the space in which the symbol set is laid out.)126 346.8
R 1.095(Resources are important)6.095 F .961(because the)126 358.8 R
3.461(ya)-.15 G .961(re scarce; there are neither an in\214nite number \
of symbols nor is there an)-3.461 F .604(in\214nite amount of space.)126
370.8 R .604(In order to create ne)5.604 F 3.104(ww)-.25 G .605
(ords, one must use some combination)-3.204 F .7(of e)126 382.8 R .7
(xisting symbols that requires space.)-.15 F .7
(Resources are also important because installing)5.7 F 1.76
(them and reading them requires ef)126 394.8 R 1.76(fort. Accordingly)
-.25 F 4.26(,i)-.65 G 4.26(nm)-4.26 G(an)-4.26 E 4.26(yl)-.15 G 1.76
(anguages the most fre-)-4.26 F(quently used w)126 406.8 Q
(ords are short.)-.1 E 1.4(The scarcity of resources af)126 422.4 R
1.399(fects electronic markup in the same w)-.25 F 1.399(ay that it af)
-.1 F 1.399(fects the)-.25 F 1.844(main te)126 434.4 R 1.844
(xt; it encourages bre)-.15 F(vity)-.25 E 6.844(.W)-.65 G 1.845
(here markup is added manually)-6.844 F 4.345(,t)-.65 G 1.845
(here is a strong)-4.345 F 1.047(desire to k)126 446.4 R 1.047(eep the \
most frequent forms of markup concise, so as to reduce input ef)-.1 F
(fort.)-.25 E(Ev)126 458.4 Q .051(en a v)-.15 F .052
(erbose markup scheme such as L)-.15 F/F2 8/Times-Roman@0 SF(A)-2.24
-1.5 M F0(T)-1 1.5 M(E)-1.6 2 M 2.552(Xh)-1.5 -2 O .052
(as commendably brief markup for mathe-)-2.552 F .562(matics and for so\
me frequently used codes, such as those for paragraph breaks.)126 470.4
R(Markup)5.562 E 3.06(minimization techniques in SGML are designed to r\
educe the space consumed by)126 482.4 R 1.206(markup, and the ef)126
494.4 R 1.206(fort in)-.25 F -.2(vo)-.4 G(lv).2 E 1.206
(ed in installing it.)-.15 F 1.206(Where markup is added automatically)
6.206 F(,)-.65 E .549(there is less need to w)126 506.4 R .549
(orry about input ef)-.1 F .549(fort, b)-.25 F .549(ut e)-.2 F -.15(ve)
-.25 G 3.05(nh).15 G .55(ere it is undesirable to be pro\215i-)-3.05 F
-.05(ga)126 518.4 S(te with markup, since it interferes with the readab\
ility of the underlying te).05 E(xt.)-.15 E F1(Granularity)126 534 Q F0
5.585(.G)C .585(ranularity is a measure of the po)-5.585 F .585
(wer to distinguish detail, or the le)-.25 F -.15(ve)-.25 G 3.085(lo).15
G(f)-3.085 E .671(atomicity of the system.)126 546 R .672
(The granularity of markup is no greater than that of the te)5.672 F
.672(xt in)-.15 F .155(which it is embedded; tags cannot demarcate more\
precisely than a single character)126 558 R 5.155(.T)-.55 G(his)-5.155
E 2.066(is important if one considers the alphabet to be a discrete sam\
pling of a continuous)126 570 R 2.539(medium. Phonetic)126 582 R .038
(alphabets are samplings of at least tw)2.539 F 2.538(oc)-.1 G .038
(ontinuous media\212speech and)-2.538 F 3.392(ideas. As)126 594 R .892
(in an)3.392 F 3.392(ys)-.15 G .892
(ampling process, an upper bound can be gi)-3.392 F -.15(ve)-.25 G 3.392
(nf).15 G .892(or the information in)-3.392 F 2.836
(the sampling, based on the frequenc)126 606 R 5.336(yo)-.15 G 5.336(ft)
-5.336 G 2.836(he samples.)-5.336 F 2.836(This bound may be further)
7.836 F(de)126 618 Q .89(graded if the samples are not well chosen.)-.15
F -.15(Fo)5.891 G 3.391(re).15 G .891
(xample, if the Roman alphabet were)-3.541 F .686
(accurately mapped to phonemes, there w)126 630 R .686
(ould be less need for the International Phonetic)-.1 F .32 LW 198 638
126 638 DL F2(\207Alternati)126 649.8 Q -.12(ve)-.2 G(ly).12 E 2(,i)-.52
G 2(ti)-2 G 2(sp)-2 G(ossible to re)-2 E -.04(ga)-.12 G(rd o).04 E -.12
(ve)-.12 G(rstrik).12 E(es as an e)-.08 E(xtension of the alphabet.)-.12
E EP
%%Page: 6 7
%%BeginPageSetup
BP
%%EndPageSetup
/F0 10/Times-Roman@0 SF(6)126 66 Q 1.395(Alphabet. W)126 120 R 3.895(ew)
-.8 G 1.395(ould ha)-3.995 F 1.695 -.15(ve a)-.2 H 1.395
(lphabetic distinctions \(rather than conte).15 F 1.396
(xtual ones\) for)-.15 F/F1 10/Times-Italic@0 SF(sow)3.896 E F0 .184
(\(female pig\) and)126 132 R F1(sow)2.684 E F0 .184
(\(to plant\), and there w)2.684 F .184(ould be no need for lig)-.1 F
.183(atures to represent cer)-.05 F(-)-.2 E 1.892(tain v)126 144 R -.25
(ow)-.2 G 1.892(el combinations, as in).25 F F1(h\346morr)4.393 E -.1
(age)-.15 G F0(or)4.493 E F1(p\346leozoic)4.393 E F0 6.893(.T)C 1.893
(he potential for mismatch)-6.893 F 1.218(between w)126 156 R 1.218
(ords and ideas is e)-.1 F 1.218(vident in the dif)-.25 F 1.218
(ference in precision of w)-.25 F 1.218(ords used in the)-.1 F
(social sciences compared to those used in the natural sciences[17].)126
168 Q .41(Granularity af)126 183.6 R .41(fects markup in tw)-.25 F 2.91
(ow)-.1 G 2.91(ays. Markup')-3.01 F 2.91(sa)-.55 G .41
(bility to distinguish structure is ulti-)-2.91 F .184
(mately limited by the le)126 195.6 R -.15(ve)-.25 G 2.684(lo).15 G
2.684(fd)-2.684 G .184(istinction that the te)-2.684 F .184
(xt itself pro)-.15 F .183(vides; tags can do no more)-.15 F 1.127
(than de\214ne superclasses of the atomic elements already in the te)126
207.6 R 3.627(xt. Second,)-.15 F 1.127(markup is)3.627 F 1.03(itself te)
126 219.6 R 1.03(xt, and so itself e)-.15 F 1.029(xhibits granularity)
-.15 F 6.029(.T)-.65 G 1.029(he number of tags and the rules for their)
-6.029 F(combination also constitute a fundamental limit on the e)126
231.6 Q(xpressi)-.15 E .3 -.15(ve p)-.25 H -.25(ow).15 G(er of markup.)
.25 E/F2 10/Times-Bold@0 SF(Order)126 247.2 Q F0 6.261(.O)C 1.261
(rder in te)-6.261 F 1.261(xt, as we ha)-.15 F 1.561 -.15(ve o)-.2 H
(bserv).15 E 1.261(ed, serv)-.15 F 1.262
(es to redress the limitation of a small)-.15 F 1.119
(alphabet by permitting position-dependent combination of characters.)
126 259.2 R -1.25 -.7(Te x)6.119 H 3.619(ti).7 G 3.618(sg)-3.619 G
(enerally)-3.618 E .494(ordered linearly)126 271.2 R 2.994(,a)-.65 G
2.994(sas)-2.994 G .494(ingle stream of characters.)-2.994 F .494
(This order is used because for most of)5.494 F .025(the history of te)
126 283.2 R .025
(xts, the processor has been a human being, reproducing the te)-.15 F
.024(xt as speech.)-.15 F .811(The reproduction order of te)126 295.2 R
.812(xt is a total order; e)-.15 F -.15(ve)-.25 G .812
(ry element in the te).15 F .812(xt is ordered with)-.15 F .337
(respect to e)126 307.2 R -.15(ve)-.25 G .337(ry other).15 F 5.337(.M)
-.55 G(oreo)-5.337 E -.15(ve)-.15 G 1.137 -.4(r, t).15 H .337
(his order is achie).4 F -.15(ve)-.25 G 2.837(di).15 G 2.837(na)-2.837 G
(relati)-.001 E -.15(ve)-.25 G 2.836(,r).15 G .336(ather than an abso-)
-2.836 F .043(lute f)126 319.2 R .043(ashion; that is, e)-.1 F -.15(ve)
-.25 G .043(ry atomic element is related to just tw).15 F 2.544(oo)-.1 G
.044(thers \(its predecessor and)-2.544 F 1.811(its successor\).)126
331.2 R 1.811
(Documents that are not primarily intended to be rendered into speech)
6.811 F 1.542(often contain non-linear elements, such as tables, mar)126
343.2 R 1.543(ginalia, cross-references, aligned)-.18 F
(translations, and footnotes.)126 355.2 Q 1.108
(In electronic uses, order typically serv)126 370.8 R 1.107
(es as the controlling sequence of markup access;)-.15 F .107(the marku\
p processor encounters the markup in the order in which it occurs when \
the te)126 382.8 R(xt)-.15 E .398(is consulted in reproduction order)126
394.8 R 5.398(.T)-.55 G .398
(hus, typesetting markup is usually found ne)-5.398 F .397(xt to the)
-.15 F .697(document element whose presentation it modi\214es.)126 406.8
R .698(Markup systems can also rely on the)5.697 F .75
(total order to indicate substructure in the markup; for e)126 418.8 R
.75(xample, paired tags that are con-)-.15 F .003(tained within some ot\
her tag pair are usually considered to be nested within the latter pair)
126 430.8 R(.)-.55 E(In this case, the total order is vie)126 442.8 Q
(wed as a depth-\214rst tra)-.25 E -.15(ve)-.2 G
(rsal of the implied hierarch).15 E -.65(y.)-.05 G F2(Update)126 458.4 Q
F0 3.492(.T)C .992(he properties discussed so f)-3.492 F .992(ar ha)-.1
F 1.292 -.15(ve b)-.2 H .991(een static ones.).15 F .991(Electronic te)
5.991 F .991(xt also has)-.15 F 2.366(speci\214c dynamic properties.)126
470.4 R 2.366(There are tw)9.866 F 4.866(oi)-.1 G 2.366
(mportant update characteristics of te)-4.866 F(xt,)-.15 E(deri)126
482.4 Q -.15(ve)-.25 G 3.23(df).15 G .73(rom the order of the te)-3.23 F
.729(xt and its redundanc)-.15 F 4.529 -.65(y. O)-.15 H .729
(rder in the te).65 F .729(xt is speci\214ed in a)-.15 F(relati)126
494.4 Q .777 -.15(ve f)-.25 H .477(ashion; this means that the insertio\
n of characters can be done by breaking only).05 F .43
(the relationship between the tw)126 506.4 R 2.93(oa)-.1 G .43
(djacent characters that surround the insertion point; all)-2.93 F .26
(other characters simply maintain their relati)126 518.4 R .56 -.15
(ve p)-.25 H 2.76(osition.\207 The).15 F .26(inserted fragment no)2.76 F
2.76(wp)-.25 G(ar)-2.76 E(-)-.2 E .125(ticipates in an ordering relatio\
nship with all other characters in the te)126 530.4 R .125
(xt, and does so with-)-.15 F(out the need for transiti)126 542.4 Q .3
-.15(ve s)-.25 H(peci\214cation of these relationships.).15 E 1.139
(The second update characteristic is due to the inherent redundanc)126
558 R 3.638(yo)-.15 G 3.638(ft)-3.638 G -.15(ex)-3.638 G 3.638(t. In).15
F 1.138(order to)3.638 F 1.537(update a gi)126 570 R -.15(ve)-.25 G
4.037(nw).15 G 1.537(ord \(for instance, to change its spelling\), it i\
s necessary to locate all)-4.137 F 1.016(copies of the w)126 582 R 1.016
(ord and change them each indi)-.1 F(vidually)-.25 E 6.016(.T)-.65 G
1.015(he standard representation for)-6.016 F(te)126 594 Q .167
(xt, then, maintains position information as concisely as possible, b)
-.15 F .168(ut k)-.2 F .168(eeps man)-.1 F 2.668(yc)-.15 G(opies)-2.668
E(of an)126 606 Q 2.5(yg)-.15 G -2.15 -.25(iv e)-2.5 H 2.5(nw).25 G
(ord.)-2.6 E .32 LW 198 614 126 614 DL/F3 8/Times-Roman@0 SF .207
(\207While not literally true in most te)126 625.8 R .207
(xt editor implementations, this is the illusion the)-.12 F 2.207(ys)
-.12 G(upport.)-2.207 E .257(The actual implementation of insertion oft\
en requires that the positions of all of the succeed-)126 635.8 R .127
(ing characters are actually updated, because the)126 645.8 R 2.127(ya)
-.12 G .127(re stored in absolute order rather than rela-)-2.127 F(ti)
126 655.8 Q .24 -.12(ve o)-.2 H(rder).12 E(.)-.44 E EP
%%Page: 7 8
%%BeginPageSetup
BP
%%EndPageSetup
/F0 10/Times-Roman@0 SF(7)481 66 Q .265
(Markup inherits its update characteristics from te)126 120 R 2.765
(xt. The)-.15 F .265(insertion of a tag into a te)2.765 F .265(xt is a)
-.15 F(relati)126 132 Q .831 -.15(ve u)-.25 H .531(pdate that attaches \
to the tag all the dependencies that are implied by that loca-).15 F
.464(tion \(for e)126 144 R .464(xample, it may become a member of all \
the tag pairs that surround it\), without)-.15 F .548
(the need to specify them e)126 156 R(xplicitly)-.15 E 5.548(.T)-.65 G
.549(he property of redundanc)-5.548 F 3.049(yi)-.15 G 3.049(sa)-3.049 G
.549(lso present; in order)-3.049 F .066(to change a tag')126 168 R
2.566(sn)-.55 G .065(ame it is necessary to locate all copies of the ta\
g and change them indi-)-2.566 F(vidually)126 180 Q 7.112(.R)-.65 G
(edundanc)-7.112 E 4.612(ym)-.15 G(ak)-4.612 E 2.112(es con)-.1 F -.15
(ve)-.4 G 2.113(rting presentational markup to descripti).15 F 2.413
-.15(ve m)-.25 H(arkup).15 E(dif)126 192 Q(\214cult, since each instanc\
e of presentation must be separately considered.)-.25 E .696
(The four classes of properties interact in roughly the follo)126 207.6
R .696(wing manner:)-.25 F 3.196(Ad)5.696 G .696(esired le)-3.196 F -.15
(ve)-.25 G(l).15 E 1.51(of granularity determines a set of atomic e)126
219.6 R 1.51(xpressions, kno)-.15 F 1.51(wn as an alphabet, and also)
-.25 F .343(determines the rules for creating compound e)126 231.6 R
2.842(xpressions. The)-.15 F .342(alphabet, the rules, and the)2.842 F
.956(medium are collecti)126 243.6 R -.15(ve)-.25 G .956
(ly the resources at the disposal of an author).15 F 5.956(.T)-.55 G
.957(hese resources are)-5.956 F 1.675(used in creating a te)126 255.6 R
4.174(xt. The)-.15 F(te)4.174 E 1.674
(xt is ordered and redundant, and therefore has speci\214c)-.15 F
(update characteristics.)126 267.6 Q/F1 10/Times-Bold@0 SF 2.5
(4. Implications)126 291.6 R -.25(fo)2.5 G 2.5(rm).25 G(arkup.)-2.5 E F0
.589(The properties of te)126 307.2 R .589(xt bear on markup')-.15 F
3.089(sd)-.55 G .589(esign and use.)-3.089 F .59
(These properties are also at the)5.589 F .652
(root of the more widely kno)126 319.2 R .652(wn problems with markup.)
-.25 F 2.252 -.8(We n)5.652 H 1.152 -.25(ow c).8 H .652
(onsider some of these).25 F(problems in more detail.)126 331.2 Q .095
(As mentioned earlier)126 346.8 R 2.595(,t)-.4 G .095
(he resources of a te)-2.595 F .095
(xt are its symbols and its positions.)-.15 F .096(Markup, as)5.096 F
2.21(embedded te)126 358.8 R 2.21
(xt, consumes both symbols and positions.)-.15 F 2.21
(Consider the consumption of)7.21 F 3.173(symbols. In)126 370.8 R .673
(order to be part of a te)3.173 F .674(xt, markup must use te)-.15 F
.674(xtual symbols.)-.15 F .674(In order to be)5.674 F .201
(separable from the te)126 382.8 R .201
(xt, something must \215ag the distinction between markup and content.)
-.15 F .354(One approach to separability is to partition the character \
set, choosing markup characters)126 394.8 R .166
(from one subset and content characters from another)126 406.8 R 5.165
(.P)-.55 G .165(artitioning is widely used to sepa-)-5.315 F .601
(rate punctuation characters from alphabetic characters.)126 418.8 R
-.15(Pa)5.601 G .601(rtitioning is also used in some).15 F .14
(popular w)126 430.8 R .139(ord processors that k)-.1 F .139
(eep `hidden' bytes, chosen from outside the ASCII charac-)-.1 F .687
(ter set, to store formatting information.)126 442.8 R 2.287 -.8(We m)
5.687 H .687(ight call partitioning).8 F/F2 10/Times-Italic@0 SF(lo)
3.188 E(go)-.1 E(gr)-.1 E(aphic)-.15 E F0(markup,)3.188 E 1.762(since i\
t resembles logographic writing systems in allocating a unique symbol t\
o each)126 454.8 R(`w)126 466.8 Q 3.592(ord'. In)-.1 F 1.092
(both cases the disadv)3.592 F 1.093
(antage is clear; logographic systems require lar)-.25 F 1.093(ge, and)
-.18 F(possibly unbounded, alphabets.)126 478.8 Q .394(The more usual a\
pproach to separability is to use the same character set for both marku\
p)126 494.4 R .435(and content, b)126 506.4 R .435
(ut to isolate markup and content in separate streams or modes.)-.2 F
.435(Modes can)5.435 F 1.437(be identi\214ed in se)126 518.4 R -.15(ve)
-.25 G 1.437(ral w).15 F 1.437(ays; for e)-.1 F 1.437
(xample, one might maintain e)-.15 F 1.436(xternal structures that)-.15
F 1.048(indicate which parts of the te)126 530.4 R 1.048
(xt are content and which are markup.)-.15 F 1.048(The more common)6.048
F .112(approach, ho)126 542.4 R(we)-.25 E -.15(ve)-.25 G .912 -.4(r, i)
.15 H 2.612(st).4 G 2.612(oa)-2.612 G .111
(llocate a small number of characters \(or character sequences\) to)
-2.612 F 1.073(indicate a mode switch.)126 554.4 R 1.073
(This approach is adopted because it is supportable by parsers.)6.073 F
1.423(Dedicating e)126 566.4 R -.15(ve)-.25 G 3.923(no).15 G 1.423
(ne character to mode switching is irritating, ho)-3.923 F(we)-.25 E
-.15(ve)-.25 G 2.222 -.4(r, s).15 H 1.422(ince it seems).4 F(ine)126
578.4 Q 1.078
(vitable that such characters need to appear as content occasionally)
-.25 F 6.079(.T)-.65 G 1.079(hus, an escape)-6.079 F .915
(technique must be used \(typically)126 590.4 R 3.415(,d)-.65 G .915
(oubling the mode switch character or using another)-3.415 F .894(chara\
cter as an escape indicator\) to \215ag that the mode switch character \
should be inter)126 602.4 R(-)-.2 E .659(preted as a literal.)126 614.4
R .659(Escape sequences must themselv)5.659 F .658
(es be escapable, and so on.)-.15 F(Though)5.658 E 1.036(no formal dif)
126 626.4 R 1.037(\214culties are raised by this technique, fe)-.25 F
3.537(ws)-.25 G 1.037(ystems implement it \215a)-3.537 F(wlessly)-.15 E
(.)-.65 E .091(UNIX users, for e)126 638.4 R .091(xample, are f)-.15 F
.091(amiliar with the dilemma of trying to determine ho)-.1 F 2.59(wm)
-.25 G(an)-2.59 E(y)-.15 E 2.613
(quotes and backslashes are needed to protect a command line ar)126
650.4 R 2.614(gument from shell)-.18 F EP
%%Page: 8 9
%%BeginPageSetup
BP
%%EndPageSetup
/F0 10/Times-Roman@0 SF(8)126 66 Q 2.727(interpretation. Another)126 120
R -.15(ex)2.727 G .227(ample is the C++ template f).15 F(acility)-.1 E
2.727(.A)-.65 G .226(template parameter list is)-.001 F
(bounded by angle brack)126 132 Q
(ets, and no spaces are necessary in constructs lik)-.1 E(e:)-.1 E/F1 10
/Courier@0 SF(template class set;)151 147.6 Q -4
(set a_set;)151 159.6 R F0 .797
(If the parameter list itself contains a template, ho)126 175.2 R(we)
-.25 E -.15(ve)-.25 G 1.597 -.4(r, t).15 H .797(hen a space).4 F/F2 10
/Times-Italic@0 SF(is)3.298 E F0 .798(required to help)3.298 F
(the system distinguish the end brack)126 187.2 Q(ets:)-.1 E F1
(set >)151 202.8 Q(a_set_of_sets;)16 E F0 2.5(At)126 218.4 S
(hird e)-2.5 E(xample might be SGML)-.15 E 1.1 -.55('s r)-.92 H
(ecord separator problem.).55 E 1.158
(The resource of positions can also result in problems. If the te)126
234 R 1.158(xt does not permit o)-.15 F -.15(ve)-.15 G -.2(r-).15 G
(strik)126 246 Q .27
(es, then there can be at most one character at each position.)-.1 F .27
(Positions thus become a)5.27 F .157(scarce commodity)126 258 R 2.657
(,e)-.65 G .156
(specially for situations in which more than one tag ought to occup)
-2.657 F 2.656(ya)-.1 G .141(single position.)126 270 R .141
(In a descripti)7.641 F .441 -.15(ve m)-.25 H .141(arkup system, for e)
.15 F .142(xample, it is usual to demarcate the)-.15 F 1.018
(start and end of a te)126 282 R 1.018
(xt fragment with tags that correspond to its element type.)-.15 F 1.017
(If a te)6.017 F(xt)-.15 E .325
(fragment belongs to more than one element type, ho)126 294 R(we)-.25 E
-.15(ve)-.25 G 1.125 -.4(r, o).15 H .325(ne is f).4 F .325
(aced with the problem)-.1 F .642(of putting tw)126 306 R 3.142(oo)-.1 G
3.142(rm)-3.142 G .641(ore tags at the same position in the te)-3.142 F
3.141(xt. Some)-.15 F .641(possible taggings for)3.141 F
(such a situation include:)126 318 Q 18.06(\(i\) -)227.9 348 R 2.5
(-------)2.5 G()-2.5 E 15.28(\(ii\) -)227.9 360 R 2.5
(-------)2.5 G()-2.5 E 12.5(\(iii\) - - - - - - - -)2.5 E 1.709
(The \214rst solution identi\214es the fragment as both an X and a Y)126
393.6 R 4.21(,b)-1.29 G 1.71(ut cannot be distin-)-4.41 F .416
(guished from a nesting of the tw)126 405.6 R 2.915(oe)-.1 G 2.915
(lements. The)-2.915 F .415(second solution is distinguishable from)
2.915 F .94(nesting, b)126 417.6 R .94(ut is not conte)-.2 F 3.44
(xt-free. Neither)-.15 F .94(of the \214rst tw)3.44 F 3.44(os)-.1 G .94
(olutions is rob)-3.44 F .94(ust to insertions)-.2 F .286
(between and , since the)126 429.6 R 2.786(yw)-.15 G .286
(ill change the relationship from coincidence to o)-2.786 F -.15(ve)-.15
G -.2(r-).15 G .264(lap. The third solution combines the tw)126 441.6 R
2.765(oe)-.1 G .265(lements, is distinguishable from nesting, and is)
-2.765 F(rob)126 453.6 Q .071(ust to the problem of insertions.)-.2 F
(Ho)5.071 E(we)-.25 E -.15(ve)-.25 G .871 -.4(r, i).15 H 2.571(tr).4 G
.071(equires a local o)-2.571 F -.15(ve)-.15 G .07
(rriding of the order of).15 F 1.382(the te)126 465.6 R 1.382
(xt, since the order of the identi\214ers X and Y must be immaterial.)
-.15 F 1.383(In ef)6.383 F 1.383(fect, this)-.25 F .218
(de\214nes an equi)126 477.6 R -.25(va)-.25 G .217
(lence class consisting of the tags and .).25 F .217
(The third solution)5.217 F .179
(is thus a form of logographic markup, since we are e)126 489.6 R .18
(xtending the alphabet to include ne)-.15 F(w)-.25 E(equi)126 501.6 Q
-.25(va)-.25 G(lence classes of characters.).25 E 1.403
(Consumption of positions has other deleterious ef)126 517.2 R 3.903
(fects. Embedded)-.25 F 1.402(tags can af)3.903 F 1.402(fect an)-.25 F
(y)-.15 E 1.08(search based on relati)126 529.2 R 1.38 -.15(ve p)-.25 H
1.08(osition, such as proximity or re).15 F 1.08(gular e)-.15 F 1.08
(xpression search.)-.15 F -.8(Ta)6.08 G(gs).8 E .992
(can in\215ate the distance between tw)126 541.2 R 3.492(ot)-.1 G -.15
(ex)-3.492 G 3.491(tf).15 G .991(ragments so that the)-3.491 F 3.491(yf)
-.15 G .991(all outside the bounds)-3.591 F .334
(speci\214ed for a proximity search; if tags appear within w)126 553.2 R
.334(ords \(consider markup of diacrit-)-.1 F 1.934(ics or lig)126 565.2
R 1.933(atures, as in representing)-.05 F 10.263 -4.165(\250u b)5.268 H
(y)4.165 E F1(ü)4.433 E F0 4.433(\)t)C(he)-4.433 E 4.433(yc)-.15 G
1.933(an defeat re)-4.433 F 1.933(gular e)-.15 F(xpression)-.15 E .885
(searching that does not tak)126 577.2 R 3.385(et)-.1 G .885
(he markup into account, so that a search for)-3.385 F F1(f.r)3.386 E F0
(matches)3.386 E F2(for)126 589.2 Q F0(,)A F2<8c72>3.495 E F0(,)A F2
(far)3.495 E F0(and)3.495 E F2(fur)3.495 E F0 3.495(,b)C .995(ut not)
-3.695 F F2 .555<66a8>3.495 G(ur)-4.44 E F0 5.995(.T)C .994
(he insertion of tags also af)-5.995 F .994(fects document processing)
-.25 F 1.947(systems that rely on absolute positions.)126 601.2 R 1.948
(One consequence is that documents that are)6.947 F(mark)126 613.2 Q
.053(ed up `on the \215y' must k)-.1 F .053
(eep track of the original positions of the te)-.1 F .052
(xt in order to pro-)-.15 F 3.171(vide useful error messages[16].)126
625.2 R 3.171(Some documents cannot be modi\214ed by inserting)8.171 F
1.15(markup because their absolute positions are inde)126 637.2 R -.15
(xe)-.15 G 3.65(db).15 G 3.65(yo)-3.65 G 1.15(ther tools in the en)-3.65
F(vironment.)-.4 E 1.522(An important e)126 649.2 R 1.523
(xample is program source code, in which characters' positions may be)
-.15 F EP
%%Page: 9 10
%%BeginPageSetup
BP
%%EndPageSetup
/F0 10/Times-Roman@0 SF(9)481 66 Q(kno)126 120 Q .719(wn by deb)-.25 F
.719(uggers, syntax-directed editors, code pro\214lers, compilers, and \
source code)-.2 F(control systems.)126 132 Q 1.687(Let us no)126 147.6 R
4.188(wl)-.25 G 1.688
(ook at the implications of granularity for markup.)-4.188 F 1.688
(Because it shares the)6.688 F(data')126 159.6 Q 3.408(sr)-.55 G .907(e\
presentation, markup is bound to the granularity of the representation:\
it shares)-3.408 F 1.015(the data')126 171.6 R 3.515(sl)-.55 G -2.15
-.25(ev e)-3.515 H 3.515(lo).25 G 3.515(fd)-3.515 G 3.515
(iscreteness. The)-3.515 F 1.015(chief ef)3.515 F 1.015
(fect of granularity is to mak)-.25 F 3.516(ei)-.1 G 3.516(td)-3.516 G
(if)-3.516 E 1.016(\214cult to)-.25 F -.15(ex)126 183.6 S 1.057
(press structure that is not a subset of character positions in the te)
.15 F 3.557(xt. Thematic)-.15 F(struc-)3.557 E 1.286(tures are one e)126
195.6 R 1.286(xample; Hamlet may ha)-.15 F 1.586 -.15(ve m)-.2 H 1.286
(oments of indecisi).15 F -.15(ve)-.25 G 1.286(ness, b).15 F 1.287
(ut these are not)-.2 F 1.548
(well correlated with unique character sequences in the te)126 207.6 R
1.547(xt of the play[28].)-.15 F(Thematic)6.547 E .383(structure, lik)
126 219.6 R 2.883(em)-.1 G(an)-2.883 E 2.883(yc)-.15 G(ate)-2.883 E .384
(gories, is de\214ned not by a set of necessary and suf)-.15 F .384
(\214cient proper)-.25 F(-)-.2 E 1.001(ties, b)126 231.6 R 1.001
(ut instead by possessing a suf)-.2 F 1.001
(\214cient number of characteristics, none of which are)-.25 F .831
(essential[20, 3].)126 243.6 R .832
(Probabilistic or statistical information about the te)5.831 F .832
(xt is also unlik)-.15 F .832(ely to)-.1 F(ha)126 255.6 Q .915 -.15
(ve d)-.2 H .615(iscrete boundaries.).15 F .615(The position of mar)
5.615 F .615(ginalia and other non-sequential commen-)-.18 F .359
(tary is not precise to within a single character)126 267.6 R 5.359(.H)
-.55 G .359(igh le)-5.359 F -.15(ve)-.25 G 2.86(ls).15 G .36
(tructures are not al)-2.86 F -.1(wa)-.1 G .36(ys com-).1 F 1.164
(positions of lo)126 279.6 R 3.664(wl)-.25 G -2.15 -.25(ev e)-3.664 H
3.664(lf).25 G 1.164(eatures; people ha)-3.664 F 1.464 -.15(ve t)-.2 H
1.364 -.1(wo a).15 H 1.164(rms, b).1 F 1.164
(ut this is not a consequence of)-.2 F 1.309(their possession of tw)126
291.6 R 3.809(ok)-.1 G 1.309
(inds of cells, those that belong to arms and those that do not)-3.809 F
1.683(\(consider blood, nerv)126 303.6 R 1.683(es, lig)-.15 F 4.183
(aments\). In)-.05 F 1.682(general, structure is not al)4.183 F -.1(wa)
-.1 G 1.682(ys reducible to a).1 F(functional description of a system')
126 315.6 Q 2.5(ss)-.55 G(ubcomponents[23].)-2.5 E .708
(Granularity problems often sho)126 331.2 R 3.208(wu)-.25 G 3.208(pa)
-3.208 G 3.208(si)-3.208 G(ndeterminac)-3.208 E 3.208(yi)-.15 G 3.208
(na)-3.208 G .708(pplying descripti)-3.208 F 1.009 -.15(ve m)-.25 H .709
(arkup to).15 F .039(white space and punctuation.)126 343.2 R .039
(As these elements are themselv)5.039 F .038
(es markup \(though for a dif-)-.15 F .925(ferent function\), it is not\
surprising that there are problems in applying another le)126 355.2 R
-.15(ve)-.25 G 3.425(lo).15 G(f)-3.425 E .168(markup to them.)126 367.2
R .168(Sentences that end in full-stop abbre)5.168 F .168
(viations, for e)-.25 F .167(xample, will not ha)-.15 F -.15(ve)-.2 G
1.531(an e)126 379.2 R 1.531
(xtra full stop to signal the end of the sentence.)-.15 F 1.531
(If markup is used to identify the)6.531 F(abbre)126 391.2 Q .399
(viation, is the punctuation part of the abbre)-.25 F .398
(viation or part of the sentence?)-.25 F .398(If punc-)5.398 F .399
(tuation or white space is included within the entity)126 403.2 R 2.899
(,i)-.65 G 2.899(tm)-2.899 G .4(ay be erroneously remo)-2.899 F -.15(ve)
-.15 G 2.9(di).15 G 2.9(ft)-2.9 G(he)-2.9 E .588(entity is modi\214ed.)
126 415.2 R .587
(White space, when used as a delimiter for both markup and te)5.588 F
.587(xt, can)-.15 F .566(become confused if markup is treated as option\
al \(as in the case of SGML)126 427.2 R 1.666 -.55('s C)-.92 H(ONCUR\).)
.55 E(The interaction between punctuation and markup can also complicat\
e string searching.)126 439.2 Q 3.863(At)126 454.8 S 1.362
(hird class of dif)-3.863 F 1.362(\214culty arises from markup')-.25 F
3.862(si)-.55 G 1.362(nheritance of the te)-3.862 F(xt')-.15 E 3.862(so)
-.55 G(rder)-3.862 E 6.362(.T)-.55 G -.15(ex)-7.062 G 3.862(ti).15 G(s)
-3.862 E 1.36(totally ordered; thus markup')126 466.8 R 3.861(sm)-.55 G
1.361(ost natural use is to e)-3.861 F 1.361
(xpress orders that are consistent)-.15 F .33(with this total order)126
478.8 R 2.83(,s)-.4 G .33(uch as hierarchies.)-2.83 F .33
(It is interesting to speculate whether the widely)5.33 F .217
(accepted vie)126 490.8 R 2.717(wt)-.25 G .218(hat documents are hierar\
chical is a result of deep thought about document)-2.717 F 1.692
(structure, or simply a result of years of e)126 502.8 R 1.691
(xperience with mark)-.15 F 1.691(ed up te)-.1 F 4.191(xts. Whiche)-.15
F -.15(ve)-.25 G(r).15 E -.15(ex)126 514.8 S .867(planation is true, it\
has also been said that the interesting structures in documents are).15
F(lar)126 526.8 Q .157(gely the non-hierarchical ones[24].)-.18 F .157
(Proposed future applications such as h)5.157 F(yperte)-.05 E .157
(xt and)-.15 F(acti)126 538.8 Q .858 -.15(ve d)-.25 H .558
(ocuments are also non-hierarchical.).15 F(Ev)5.558 E .558
(en the table, ho)-.15 F(we)-.25 E -.15(ve)-.25 G 1.358 -.4(r, p).15 H
.558(roduces problems).4 F 1.529
(for markup and other systems that are based on a total order)126 550.8
R 6.529(.C)-.55 G 1.529(onsider the follo)-6.529 F(wing)-.25 E(table:)
126 562.8 Q -17.78 18.055(AB C)286 592.8 T .4 LW 349.61 597.3 262.39
597.3 DL 15(X2)262.39 606.8 S 15(45)-15 G 17.5(51)-15 G(9)-17.5 E -17.5
17.5(Y3 01)262.39 618.8 T(23)-17.5 E -18.61 18.055(Z1 1)262.945 630.8 T
(1)4.445 E 277.11 583.3 277.11 633.3 DL EP
%%Page: 10 11
%%BeginPageSetup
BP
%%EndPageSetup
/F0 10/Times-Roman@0 SF(10)126 66 Q .127
(Instances of tables can be captured as sequentially tagged te)126 120 R
2.627(xts. F)-.15 F .127(or e)-.15 F .127(xample, the preced-)-.15 F
(ing table might be represented in the follo)126 132 Q(wing w)-.25 E
(ay:)-.1 E/F1 10/Courier@0 SF(center;)126 156 Q 6(c|ccc)126 168 S(.)-6 E
19(ABC)151 180 S(_)126 192 Q 19(X2)126 204 S 13(45)-19 G 13(51)-13 G(9)
-13 E 19(Y301)126 216 S(23)-19 E 19(Z111)126 228 S F0 1.243
(The \214rst problem with representing tables as mark)126 264 R 1.243
(ed-up te)-.1 F 1.243(xts is the scarce resource of)-.15 F 1.16
(positions, described pre)126 276 R(viously)-.25 E 6.16(.T)-.65 G 1.16
(he w)-6.16 F 1.16(ords in a te)-.1 F 1.16
(xt belong to a single sequential rela-)-.15 F .498(tionship, b)126 288
R .498(ut the `w)-.2 F .498(ords' or data v)-.1 F .498
(alues in a table belong to multiple orthogonal relation-)-.25 F 3.745
(ships. Thus,)126 300 R 1.245(tables e)3.745 F 1.245
(xhibit the need to identify a te)-.15 F 1.246
(xt fragment as an instance of more)-.15 F .1(than one element type.)126
312 R .1(In the table preceding, the v)5.1 F .099
(alue 19 is both a C and an X, b)-.25 F .099(ut only)-.2 F
(one of these f)126 324 Q(acts is `near' the v)-.1 E(alue.)-.25 E .444
(The second problem is o)126 339.6 R -.15(ve)-.15 G 2.944
(rspeci\214cation. W).15 F 2.945(em)-.8 G .445
(ight conclude from the mark)-2.945 F .445(ed-up repre-)-.1 F .453
(sentation of the table that 123 `follo)126 351.6 R .452
(ws' 19, since it comes later in the sequence.)-.25 F .452(But the)5.452
F .54(table does not require this, unless it is the case that Y follo)
126 363.6 R .541(ws X.)-.25 F .541(The linear structure of)5.541 F
(the te)126 375.6 Q(xt is an o)-.15 E -.15(ve)-.15 G
(rspeci\214cation of this \(and an).15 E 2.5(yo)-.15 G(ther\) set-v)-2.5
E(alued structure.)-.25 E 3.192(At)126 391.2 S .692
(hird interesting dif)-3.192 F .692
(ference between tables and sequential te)-.25 F .691(xt is the dif)-.15
F .691(ference in nor)-.25 F(-)-.2 E 3.029(malization. As)126 403.2 R
.529(mentioned earlier)3.029 F 3.029(,t)-.4 G -.15(ex)-3.029 G .529
(ts are highly redundant in their data v).15 F .53(alues, b)-.25 F .53
(ut not)-.2 F 1.864(redundant in their use of positions.)126 415.2 R -.8
(Ta)6.864 G 1.863(bles, on the other hand, attempt to sho).8 F 4.363(we)
-.25 G(ach)-4.363 E .136
(datum only once, adjusting the layout so that the rele)126 427.2 R -.25
(va)-.25 G .137(nt dimensions impinge on the data).25 F -.25(va)126
439.2 S(lues in as natural a f).25 E(ashion as possible.)-.1 E .358
(The normalization implicit in tables and the redundanc)126 454.8 R
2.858(yi)-.15 G .358(mplicit in te)-2.858 F .358(xts is e)-.15 F .357
(vident in the)-.25 F(dif)126 466.8 Q .548
(ferent update operations needed for each.)-.25 F 2.149 -.8(To u)5.548 H
.549(pdate a te).8 F .549(xt, we typically use an editor)-.15 F 1.337(w\
ith a search-and-replace command, performing a redundant update to each\
cop)126 478.8 R 3.836(yo)-.1 G 3.836(fa)-3.836 G .929(data v)126 490.8
R 3.429(alue. T)-.25 F 3.429(oc)-.8 G .929(hange the w)-3.429 F .929
(ord `Constantinople' to `Istanb)-.1 F .929(ul', we perform a redundant)
-.2 F .658(operation on e)126 502.8 R -.15(ve)-.25 G .658
(ry instance of the w).15 F 3.158(ord. T)-.1 F 3.158(ou)-.8 G .657
(pdate a table v)-3.158 F .657(alue, on the other hand, we)-.25 F 1.026
(simply \214nd the single cop)126 514.8 R 3.526(yo)-.1 G 3.526(ft)-3.526
G 1.026(he v)-3.526 F 1.026
(alue and change it, and the change is automatically)-.25 F(`a)126 526.8
Q -.25(va)-.2 G .504(ilable' to each of the rele).25 F -.25(va)-.25 G
.503(nt dimensions.).25 F .503
(In the preceding table representation, we)8.003 F(need change the v)126
538.8 Q(alue 19 only once to af)-.25 E(fect both C and X.)-.25 E .534
(Structural update of tables represented in linear form is a dif)126
554.4 R .534(ferent matter)-.25 F 3.034(,h)-.4 G -.25(ow)-3.034 G -2.15
-.25(ev e).25 H 4.134 -.55(r. T).25 H(he).55 E .891(preceding mark)126
566.4 R .891(ed-up table supports ro)-.1 F 3.391(wi)-.25 G .891
(nterchanges, since this can be done simply by)-3.391 F .862
(interchanging lines of the te)126 578.4 R .862(xt \214le, b)-.15 F .863
(ut does not support column interchanges, since this)-.2 F .645
(requires editing each line separately)126 590.4 R 5.644(.T)-.65 G .644
(ransposition of the table is another operation that)-5.994 F -.1(wo)126
602.4 S .924(uld be e).1 F .924
(xceedingly tedious in this representation.)-.15 F -.8(Ta)5.924 G .924
(ble editing is generally not well).8 F 1.999(supported in most en)126
614.4 R 1.998
(vironments[31], and it is not our purpose here to complain that)-.4 F
.484(markup does not do better)126 626.4 R 5.484(.R)-.55 G(ather)-5.484
E 2.985(,w)-.4 G 2.985(ew)-2.985 G .485
(ish to emphasize that the order of te)-2.985 F .485(xt inherited)-.15 F
(by markup is the fundamental reason for this problem.)126 638.4 Q EP
%%Page: 11 12
%%BeginPageSetup
BP
%%EndPageSetup
/F0 10/Times-Roman@0 SF(11)476 66 Q .937(The o)126 120 R -.15(ve)-.15 G
.937(rspeci\214cation of order can also be a problem e).15 F -.15(ve)
-.25 G 3.437(nf).15 G .937(or apparently benign nested)-3.437 F(te)126
132 Q 2.865(xts. Consider)-.15 F .365(the follo)2.865 F .365
(wing fragment from a h)-.25 F .365
(ypothetical repair manual that lists prob-)-.05 F
(lems and their symptoms:)126 144 Q(section)291.835 173.56 Q(prob)
234.411 204.736 Q(prob)359.259 204.736 Q(symp)201.565 235.984 Q(symp)
263.989 235.984 Q(symp)326.341 235.984 Q(symp)388.765 235.984 Q .4 LW
243.576 193.176 306 180.72 DL 368.424 193.176 306 180.72 DL 212.4
224.352 243.576 211.896 DL 274.752 224.352 243.576 211.896 DL 337.248
224.352 368.424 211.896 DL 399.6 224.352 368.424 211.896 DL(In mark)126
269.744 Q(ed-up form, this might appear as:)-.1 E
(............)205.855 293.744 Q .475
(The symptoms are ordered within the problems, and the problems are ord\
ered within the)126 309.344 R 1.464(sections, b)126 321.344 R 1.464
(ut the order of the symptoms within the section has no meaning.)-.2 F
1.465(The total)6.465 F .622(order of the te)126 333.344 R .622
(xt is an o)-.15 F -.15(ve)-.15 G .621
(rspeci\214cation of the partial order in).15 F -.2(vo)-.4 G(lv).2 E
.621(ed in the structure.)-.15 F(As)5.621 E -.1(wa)126 345.344 S 2.5(st)
.1 G(he case with granularity)-2.5 E 2.5(,s)-.65 G(tructure is not al)
-2.5 E -.1(wa)-.1 G(ys reducible to character positions.).1 E .549
(The representation of non-linear orders is also a problem.)126 360.944
R .549(Markup adv)5.549 F .55(ocates ha)-.2 F .85 -.15(ve g)-.2 H -2.15
-.25(iv e).15 H(n).25 E 1.281(considerable thought to the problems of r\
epresenting multiple and discontiguous struc-)126 372.944 R 2.562
(tures. These)126 384.944 R .062(problems ha)2.562 F .362 -.15(ve n)-.2
H -2.15 -.25(ev e).15 H 2.562(rb).25 G .062(een seen to be f)-2.562 F
.062(atal; on the other hand, a resoundingly)-.1 F(satisf)126 396.944 Q
(actory solution to such problems has yet to be de)-.1 E
(vised[1, 2, 21, 14, 22].)-.25 E 1.071
(The fourth and \214nal class of dif)126 412.544 R 1.071
(\214culties arises from markup')-.25 F 3.571(si)-.55 G 1.07
(nheritance of the update)-3.571 F .69(properties of the te)126 424.544
R 3.19(xt. The)-.15 F .69
(virtue of sharing both update properties and resources is that)3.19 F
.11(structure can be updated with e)126 436.544 R .109
(xactly the same tools that are used to update the te)-.15 F .109
(xt itself,)-.15 F 1.178(thus ob)126 448.544 R 1.178
(viating the need to de)-.15 F -.15(ve)-.25 G 1.179
(lop a tool speci\214cally designed for structure update.).15 F(In)6.179
E .974(batch typesetter en)126 460.544 R .974(vironments, for e)-.4 F
.974(xample, users commonly emplo)-.15 F 3.474(yt)-.1 G .974
(heir standard te)-3.474 F(xt)-.15 E(editors to input the te)126 472.544
Q(xt and add the markup commands to that te)-.15 E(xt.)-.15 E 1.128
(Updating markup as if it were te)126 488.144 R 1.128
(xt is acceptable when the update characteristics of the)-.15 F .12
(markup and the te)126 500.144 R .12(xt are comparable.)-.15 F .12
(In man)5.12 F 2.62(ys)-.15 G .12(ituations, ho)-2.62 F(we)-.25 E -.15
(ve)-.25 G .92 -.4(r, t).15 H .12(he update characteris-).4 F .752
(tics dif)126 512.144 R(fer)-.25 E 5.752(.S)-.55 G .752
(ome structures are much more dynamic than the te)-5.752 F .753
(xt; consider for e)-.15 F(xample)-.15 E .729
(identifying the structures `the w)126 524.144 R .728
(ord I am currently reading', or)-.1 F 3.228(,i)-.4 G 3.228(np)-3.228 G
.728(rogram source code,)-3.228 F .329(`all uses of the v)126 536.144 R
.33(ariable X after the nth iteration of loop Y' \(where n is speci\214\
ed dynami-)-.25 F 2.581(cally\)[25]. If)126 548.144 R .081(these struct\
ures are to be represented by markup, then we need to insert and)2.581 F
1.405(delete tags dynamically while using the te)126 560.144 R 3.905
(xt. Dynamic)-.15 F 1.405(structure thus requires that the)3.905 F(te)
126 572.144 Q 1.362(xt be updatable; if the te)-.15 F 1.362
(xt is read-only)-.15 F 3.862(,t)-.65 G 1.362(hen so is its structure.)
-3.862 F 1.362(Markup inherits the)6.362 F .327
(update properties of the te)126 584.144 R .328(xt, b)-.15 F .328
(ut in general the update properties of structure and content)-.2 F
(should be independent of one another)126 596.144 Q(.)-.55 E 3.52(As)126
611.744 S 1.019
(econd update problem is that as markup has become more comple)-3.52 F
1.019(x, it is less lik)-.15 F(ely)-.1 E 2.025(that te)126 623.744 R
2.026(xt editing tools will be suf)-.15 F 2.026
(\214cient for editing markup.)-.25 F 2.026(When markup consisted)7.026
F .944(mostly of simple strings that were lar)126 635.744 R .944
(gely conte)-.18 F .943(xt-independent \(as in batch typesetters\),)-.15
F .16(the use of a te)126 647.744 R .161(xt editor to update markup w)
-.15 F .161(as reasonably reliable.)-.1 F .161(Some markup systems,)
5.161 F .518(on the other hand, permit multiple attrib)126 659.744 R
.518(utes, insist on tag pairing, e)-.2 F -.15(ve)-.25 G 3.017(nt).15 G
.517(hough members)-3.017 F EP
%%Page: 12 13
%%BeginPageSetup
BP
%%EndPageSetup
/F0 10/Times-Roman@0 SF(12)126 66 Q .708(of the pair are widely separat\
ed \(although sometimes end tags can be eliminated\), allo)126 120 R(w)
-.25 E .848(ID v)126 132 R .847
(alues and cross-references to other tags or positions in the te)-.25 F
.847(xt, and usually require)-.15 F 1.22(conformance with some e)126 144
R 1.22(xternal structure such as a grammar)-.15 F 6.22(.C)-.55 G(omple)
-6.22 E 3.72(xm)-.15 G 1.22(arkup, then,)-3.72 F .751
(has reduced the original update adv)126 156 R .751(antage; man)-.25 F
3.251(yS)-.15 G .751(GML te)-3.251 F .75(xts should not be edited with)
-.15 F 1.245(simple te)126 168 R 1.245(xt editors, and retaining this c\
apability simply risks well-intentioned b)-.15 F 1.246(ut erro-)-.2 F
(neous manual editing.)126 180 Q .665(Markup e)126 195.6 R .665
(xhibits man)-.15 F 3.165(yp)-.15 G .664
(roperties that are not shared by non-embedded structures.)-3.165 F
(Non-)5.664 E 1.071(embedded structures need not consume te)126 207.6 R
1.071(xt resources, need not limit themselv)-.15 F 1.071(es to the)-.15
F 1.55(granularity of the te)126 219.6 R 1.55
(xt, need not inherit the order of the te)-.15 F 1.55
(xt, and need not inherit the)-.15 F(update characteristics of the te)
126 231.6 Q(xt.)-.15 E/F1 10/Times-Bold@0 SF 2.5(5. Alter)126 255.6 R
(nati)-.15 E .2 -.1(ve r)-.1 H(epr)-.08 E(esentations f)-.18 E(or text.)
-.25 E F0 .906(Our in)126 271.2 R -.15(ve)-.4 G(stig).15 E .906
(ation of the implications of te)-.05 F .907
(xt characteristics for markup has presupposed)-.15 F 1.677
(the standard electronic representation:)126 283.2 R 4.176(al)6.677 G
1.676(ist of characters ordered in accordance with)-4.176 F .067
(their appearance in an output medium.)126 295.2 R .068
(This representation seems so natural that its status)5.068 F .233
(as the de\214niti)126 307.2 R .532 -.15(ve f)-.25 H .232(orm of `te).15
F .232(xt' is not e)-.15 F -.15(ve)-.25 G 2.732(nq).15 G 2.732
(uestioned. There)-2.732 F .232(are other representations for)2.732 F
(te)126 319.2 Q .704(xt, ho)-.15 F(we)-.25 E -.15(ve)-.25 G 1.504 -.4
(r, a).15 H .705(nd by considering some of them we e).4 F .705
(xpose other issues in the design of)-.15 F
(document management systems.)126 331.2 Q 1.043(Consider the follo)126
346.8 R 1.043(wing representations, each intended to be a mark)-.25 F
1.042(ed-up v)-.1 F 1.042(ersion of the)-.15 F(same te)126 358.8 Q(xt:)
-.15 E 13.06(\(i\) to)126 374.4 R
(be or not to be; that is the question...)2.5 E 10.28
(\(ii\) <6><2>be2>6><8>is8><4>not4>)126 390 R
(<3>or3><10>question10><7>that7>)151 402 Q
(<9>the9><5><1>to1>5>)151 414 Q 7.5(\(iii\) &tb;)126
429.6 R(or not &tb;; that is the question)2.5 E 2.28
(Representation \(i\) is a straightforw)126 445.2 R 2.28
(ard sequential te)-.1 F 2.28(xt string with embedded markup.)-.15 F
.264(Representation \(ii\) is a sequence of w)126 457.2 R .264
(ords, ordered alphabetically)-.1 F 2.764(,a)-.65 G .264(nd mark)-2.764
F .263(ed up in such)-.1 F 2.588(aw)126 469.2 S .088(ay that the te)
-2.688 F .088(xt can be reproduced by follo)-.15 F .088
(wing the sequence de\214ned by the tag labels.)-.25 F 1.182
(Representation \(iii\) is ag)126 481.2 R 1.182(ain a sequential te)-.05
F 1.182(xt, b)-.15 F 1.181(ut some phrases ha)-.2 F 1.481 -.15(ve b)-.2
H 1.181(een f).15 F 1.181(actored out)-.1 F(and are represented as e)126
493.2 Q(xternal entities; the tag)-.15 E/F2 10/Courier@0 SF(&tb;)2.5 E
F0(maps to the phrase `to be'.)2.5 E 1.117(The choice between these rep\
resentations is usually made on operational grounds;)126 508.8 R(one)
6.118 E .531(chooses based on estimates of the need for compression, fo\
r particular types of e)126 520.8 R(xpected)-.15 E(query)126 532.8 Q
2.617(,o)-.65 G 2.617(rf)-2.617 G .118
(or control of update anomalies. Representation \(i\) requires f)-2.617
F .118(ar fe)-.1 F .118(wer tags and is)-.25 F .49(easily read; ho)126
544.8 R(we)-.25 E -.15(ve)-.25 G 1.29 -.4(r, i).15 H 2.989(tc).4 G .489
(ontains multiple occurrences of some w)-2.989 F .489(ords and so may e)
-.1 F(xhibit)-.15 E .962(inconsistent spelling.)126 556.8 R .963
(Representation \(ii\) appears to be less redundant, storing only one)
5.962 F(cop)126 568.8 Q 2.691(yo)-.1 G 2.691(fe)-2.691 G .191(ach w)
-2.691 F .191(ord. It can easily be used to generate a w)-.1 F .19
(ord list and frequenc)-.1 F 2.69(yc)-.15 G .19(ounts, b)-2.69 F(ut)-.2
E 1.429
(requires more processing to reproduce the canonical form of the te)126
580.8 R 1.43(xt \(of course, tech-)-.15 F .559
(nique \(i\) requires more processing to produce the w)126 592.8 R .559
(ord list and frequenc)-.1 F 3.059(yc)-.15 G 3.059(ounts\). Rep-)-3.059
F .546
(resentation \(iii\) is a middle-ground solution, with some redundanc)
126 604.8 R 3.047(ye)-.15 G .547(liminated, and only)-3.047 F 2.652(am)
126 616.8 S .152(edium amount of ef)-2.652 F .151
(fort required to read the te)-.25 F .151(xt \(much of the te)-.15 F
.151(xt is already in canon-)-.15 F(ical order)126 628.8 Q 2.5(,b)-.4 G
(ut there are frequent di)-2.7 E -.15(ve)-.25 G(rsions to access e).15 E
(xternal information\).)-.15 E 1.341(Representation \(ii\) may seem f)
126 644.4 R(ar)-.1 E 1.342(-fetched to those for whom it is patently ob)
-.2 F 1.342(vious that)-.15 F(te)126 656.4 Q .861
(xts are ordered sequences.)-.15 F .861
(But this technique is simply a tagged v)5.861 F .86
(ersion of structures)-.15 F EP
%%Page: 13 14
%%BeginPageSetup
BP
%%EndPageSetup
/F0 10/Times-Roman@0 SF(13)476 66 Q .071
(that we otherwise recognize as the common concordance, the in)126 120 R
-.15(ve)-.4 G .071(rted list, or the back-of-).15 F 1.299(the-book inde)
126 132 R 3.799(x. Each)-.15 F 1.299(is an or)3.799 F -.05(ga)-.18 G
1.299(nization of a te).05 F 1.298
(xt to support a speci\214c kind of access.)-.15 F .556
(Each is a complete structure, containing the whole te)126 144 R .557
(xt; otherwise it w)-.15 F .557(ould not be possi-)-.1 F(ble to ef)126
156 Q(fect reconstruction of the Dead Sea Scrolls from a published conc\
ordance[30].)-.25 E .865(Operational concerns are important. Ho)126
171.6 R(we)-.25 E -.15(ve)-.25 G 1.665 -.4(r, t).15 H(he).4 E 3.365(yt)
-.15 G .864(end to strengthen the ar)-3.365 F .864(gument that)-.18 F
1.235(issues of markup are issues of representation of structure, and n\
ot of its abstract form.)126 183.6 R 1.174(There is one abstract issue \
that is implicit in the choice of representations, common to)126 195.6 R
(man)126 207.6 Q 3.546(yd)-.15 G 1.046(ata modelling situations:)-3.546
F 1.046(deciding what constitutes `one thing'[15].)6.046 F 1.046
(The choice)6.046 F .184(of representation can be an implicit statement\
of our notion of object, because each struc-)126 219.6 R 1.035
(ture is optimized to manage a speci\214c type of object.)126 231.6 R
1.035(Representation \(i\) is designed to)6.035 F .045
(store not characters, b)126 243.6 R .045(ut the positions that the)-.2
F 2.545(yo)-.15 G(ccup)-2.545 E 1.344 -.65(y. T)-.1 H .044
(hus, it distinguishes between and).65 F 1.765
(maintains the identity of positions.)126 255.6 R 1.766
(Representation \(ii\) is designed to store indi)6.765 F(vidual)-.25 E
-.1(wo)126 267.6 S 2.554(rds. Since).1 F .054
(the sequence of the `original' te)2.554 F .054
(xt is captured in the order implicit in the tag)-.15 F .449(identi\214\
ers, the sequence in the data structure is free to be used for some oth\
er purpose\212)126 279.6 R .109(in this case, the le)126 291.6 R .109
(xicographic order of the w)-.15 F 2.608(ords. Representation)-.1 F .108
(\(iii\) stores the positions)2.608 F .311(occupied by a mix)126 303.6 R
.311(ed bag of characters and phrases, and is designed to maintain the \
iden-)-.15 F(tity of both the positions and the phrases.)126 315.6 Q .62
(Issues of identity are subtle, b)126 331.2 R .619
(ut not without impact.)-.2 F .619(In a relational database, tw)5.619 F
3.119(ot)-.1 G(uples)-3.119 E .451(with the same k)126 343.2 R .751 -.15
(ey i)-.1 H 2.951(nf).15 G .451(act denote only one thing.)-3.051 F .451
(In a traditional te)5.451 F .452(xt database using rep-)-.15 F .485
(resentation \(i\), tw)126 355.2 R 2.985(oo)-.1 G .485(ccurrences of `t\
o be' are still separate objects; in representation \(iii\))-2.985 F
(the)126 367.2 Q 2.637(ya)-.15 G .137
(re copies of the same object; in representation \(ii\) the)-2.637 F
2.637(ya)-.15 G .137(re made up of copies of the)-2.637 F
(objects `to' and `be'.)126 379.2 Q .871(Identity is also important in \
normalization, an issue that has remained lar)126 394.8 R .87
(gely hidden in)-.18 F .003(document management systems.)126 406.8 R
.003(Normalization is the process of adjusting the design of a)5.003 F
.003(database so that updates will not result in anomalies.)126 418.8 R
.003(One of the bene\214ts of normalization)5.003 F .815
(is reduced redundanc)126 430.8 R 4.615 -.65(y. T)-.15 H .815
(he three representations dif).65 F .815(fer in the types of redundanc)
-.25 F 3.315(yt)-.15 G(he)-3.315 E(y)-.15 E 2.746
(permit. Representation)126 442.8 R .246(\(i\) has redundanc)2.746 F
2.746(yi)-.15 G 2.746(nw)-2.746 G .246(ords \(hence, as noted earlier)
-2.846 F 2.745(,t)-.4 G .245(he potential)-2.745 F 1.469
(for inconsistent spelling\), whereas representation \(ii\) has remo)126
454.8 R -.15(ve)-.15 G 3.969(dt).15 G 1.469(he redundanc)-3.969 F 3.969
(yt)-.15 G(hat)-3.969 E -.1(fa)126 466.8 S 1.294
(cilitates this inconsistenc).1 F 5.094 -.65(y. R)-.15 H 1.293
(epresentation \(i\) has eliminated redundanc).65 F 3.793(yi)-.15 G
3.793(np)-3.793 G(osition,)-3.793 E 1.47
(whereas representation \(ii\) may ha)126 478.8 R 1.77 -.15(ve r)-.2 H
(edundanc).15 E 3.97(yi)-.15 G 3.97(np)-3.97 G 1.47
(ositions; that is, it permits man)-3.97 F(y)-.15 E 2.091
(instances of tag pairs ..., for some number n, thus allo)126
490.8 R 2.09(wing synon)-.25 F 2.09(yms \(e.g.,)-.15 F
(<65>Constantinople65>...<65>Istanb)126 502.8 Q .511
(ul65>\) to occur in the te)-.2 F 3.012(xt. Representation)-.15 F
(\(iii\))3.012 E .093(has remo)126 514.8 R -.15(ve)-.15 G 2.593(dt).15 G
.092(he redundanc)-2.593 F 2.592(yi)-.15 G 2.592(ns)-2.592 G .092
(ome common phrases, b)-2.592 F .092(ut it has also remo)-.2 F -.15(ve)
-.15 G 2.592(dt).15 G .092(he redun-)-2.592 F(danc)126 526.8 Q 2.5(yo)
-.15 G 2.5(fp)-2.5 G(osition.)-2.5 E(Else)126 542.4 Q 2.627(where we ha)
-.25 F 2.927 -.15(ve a)-.2 H -.18(rg).15 G 2.627(ued that softw).18 F
2.628(are design is often concerned with the choice)-.1 F .895
(between normalization and automatic processing.)126 554.4 R .895
(Systems can be constructed based on)5.895 F 1.412
(normalized data, or the)126 566.4 R 3.913(ym)-.15 G 1.413(ay track e)
-3.913 F 1.413(xisting redundanc)-.15 F 3.913(ya)-.15 G 1.413
(nd perform redundant opera-)-3.913 F .655
(tions as necessary when updates are requested[27].)126 578.4 R
(Similarly)5.655 E 3.155(,i)-.65 G 3.155(nd)-3.155 G .655
(ocument management)-3.155 F .915(systems, we often choose between redu\
ndant storage of information and automatic pro-)126 590.4 R 3.504
(cessing. Such)126 602.4 R 1.003
(issues can be described in formal terms for traditional databases, b)
3.503 F 1.003(ut we)-.2 F
(are not yet capable of doing this for document databases.)126 614.4 Q
1.936(In traditional database management systems, normalization is base\
d on e)126 630 R 1.936(xplicit state-)-.15 F .86
(ments of data dependencies, such as functional and multi)126 642 R -.25
(va)-.25 G .86(lued dependencies.).25 F .86(In tradi-)5.86 F .699(tiona\
l document management systems, such dependencies are implicit in the op\
erational)126 654 R EP
%%Page: 14 15
%%BeginPageSetup
BP
%%EndPageSetup
/F0 10/Times-Roman@0 SF(14)126 66 Q 2.464
(descriptions of the processors.)126 120 R 2.464
(Representation \(iii\), for e)7.464 F 2.464
(xample, de\214nes an implicit)-.15 F(dependenc)126 132 Q 3.12(yb)-.15 G
.62(etween the e)-3.12 F .62
(xternal phrase and the entity reference placed in the te)-.15 F 3.12
(xt. The)-.15 F .138
(implicit use of dependencies is not necessarily bad.)126 144 R(Ho)5.138
E(we)-.25 E -.15(ve)-.25 G .938 -.4(r, w).15 H 2.638(em).4 G .138
(ust at some point dis-)-2.638 F 1.662
(tinguish between the formal aspects of the dependenc)126 156 R 4.162
(ys)-.15 G 1.662(tructure and their operational)-4.162 F(ef)126 168 Q
2.781(fects. The)-.25 F .281(former belongs to a theory of document man\
agement systems, while the lat-)2.781 F
(ter belongs to discussions of their implementation.)126 180 Q/F1 10
/Times-Bold@0 SF 2.5(6. Requir)126 204 R(ements f)-.18 E
(or document management systems.)-.25 E F0 .074(Document management sys\
tems are a type of database management system, and thus will)126 219.6 R
.923(share with traditional databases issues such as storage, searching\
, normalization, update)126 231.6 R .567
(through transaction control, the possibility of distrib)126 243.6 R
.568(uted data and the possibility for par)-.2 F(-)-.2 E .193
(allel processing.)126 255.6 R .193
(But document management systems are not simply reducible to e)5.193 F
(xisting)-.15 E .441(database systems, because documents ha)126 267.6 R
.742 -.15(ve s)-.2 H .442(peci\214c requirements that are not common in)
.15 F 1.118(traditional database processing.)126 279.6 R 2.717 -.8(We n)
6.118 H -.15(ex).8 G 3.617(te).15 G 1.117
(xplore some of these requirements, and con-)-3.767 F(sider markup')126
291.6 Q 2.5(sa)-.55 G(bility to address them.)-2.5 E F1(Modelling)126
307.2 Q F0 5.675(.T)C .675(he \214rst area of dif)-5.675 F .675
(ference between te)-.25 F .676(xt databases and traditional databases)
-.15 F 1.421(is the lik)126 319.2 R 1.421(elihood of schema update.)-.1
F 1.421(In traditional databases, the data model is usually)6.421 F .713
(static; it is carefully determined in adv)126 331.2 R .713
(ance, as a de\214niti)-.25 F 1.013 -.15(ve s)-.25 H .713
(tatement of the or).15 F -.05(ga)-.18 G(nization).05 E .216(or w)126
343.2 R .216(orld it is intended to represent.)-.1 F .215
(When the data is loaded, modelling is ef)5.215 F(fecti)-.25 E -.15(ve)
-.25 G .215(ly ter).15 F(-)-.2 E 1.592(minated; the data will change, b)
126 355.2 R 1.592(ut the model of the w)-.2 F 1.592
(orld generally stays constant or)-.1 F -2.2 -.25(ev o)126 367.2 T(lv)
.25 E .418(es slo)-.15 F(wly)-.25 E 5.418(.I)-.65 G 2.917(nd)-5.418 G
.417(ocument databases, on the other hand, putting te)-2.917 F .417
(xt online is the \214rst,)-.15 F .512(not the last, step in de)126
379.2 R -.15(ve)-.25 G .512(loping a data model.).15 F .512
(Where numeric data is an interpretation of)5.512 F .14(the w)126 391.2
R .14(orld, man)-.1 F 2.64(yt)-.15 G -.15(ex)-2.64 G .14
(ts are themselv).15 F .14(es w)-.15 F .14
(orlds to be interpreted, and thus the need for mod-)-.1 F .282
(elling is potentially in\214nite.)126 403.2 R .282(Each model of a te)
5.282 F .282(xt can point to dif)-.15 F .283(ferent structures, dif)-.25
F(fer)-.25 E(-)-.2 E .213(ent elements, and dif)126 415.2 R .212(ferent\
constraints, since an essential property of interpretation is cre-)-.25
F(ati)126 427.2 Q(vity)-.25 E 5(.T)-.65 G(hus, in document databases, t\
here is often a need for dynamic modelling.)-5 E(Markup')126 442.8 Q
3.193(sa)-.55 G .694(bility to ful\214ll this need is se)-3.193 F -.15
(ve)-.25 G .694(rely limited.).15 F .694(The binding of markup')5.694 F
3.194(su)-.55 G(pdate)-3.194 E .974(properties to those of the te)126
454.8 R .973(xt sti\215es the addition of ne)-.15 F 3.473(wd)-.25 G .973
(ata models.)-3.473 F(Markup')5.973 E 3.473(su)-.55 G .973(se of)-3.473
F(te)126 466.8 Q 1.381
(xt resources means that such additions \(and hence, changes to the te)
-.15 F 1.381(xt\) will ha)-.15 F 1.681 -.15(ve a)-.2 H(n).15 E(ef)126
478.8 Q .052(fect on both internal structure \(e)-.25 F .052
(xisting markup\) and e)-.15 F .051
(xternal structure \(pointers into the)-.15 F(te)126 490.8 Q 3.215
(xt\). Markup')-.15 F 3.215(sg)-.55 G(ranularity)-3.215 E 3.215(,a)-.65
G 3.215(sw)-3.215 G 3.215(en)-3.215 G .715(oted earlier)-3.215 F 3.215
(,a)-.4 G .716(lso limits its ability to represent struc-)-3.215 F 1.363
(tures that are continuous in some w)126 502.8 R(ay)-.1 E 6.362(.C)-.65
G 1.362(omplaints about markup standards are some-)-6.362 F 2.151
(times indicati)126 514.8 R 2.451 -.15(ve o)-.25 H 4.651(ft).15 G 2.152
(he fear that markup will interfere with the free interpretation of)
-4.651 F(te)126 526.8 Q(xts[21].)-.15 E F1(Independence)126 542.4 Q F0
5.742(.A)C .742(second area of dif)-2.5 F .742(ference between te)-.25 F
.741(xt and traditional data is in their)-.15 F(dif)126 554.4 Q .243
(fering vie)-.25 F .243(ws of ho)-.25 F 2.743(wt)-.25 G 2.743(oa)-2.743
G(chie)-2.743 E .543 -.15(ve m)-.25 H .243
(odularity and independence in the systems.).15 F .244(The doc-)5.243 F
.288(ument community focuses on ensuring modularity at the le)126 566.4
R -.15(ve)-.25 G 2.788(lo).15 G 2.788(ft)-2.788 G .288
(he data, by insisting on)-2.788 F 2.099
(the interchangeability of documents.)126 578.4 R(Gi)7.099 E -.15(ve)
-.25 G 4.599(na).15 G 4.599(na)-4.599 G 2.099(ppropriately mark)-4.599 F
2.099(ed-up document, it)-.1 F .355
(should be possible to transmit it to an)126 590.4 R 2.855(yo)-.15 G
.354(ther document management system, its structure)-2.855 F 2.835
(intact. The)126 602.4 R .336(traditional database community)2.835 F
2.836(,o)-.65 G 2.836(nt)-2.836 G .336
(he other hand, focuses on ensuring mod-)-2.836 F .953
(ularity at the user')126 614.4 R 3.452(sl)-.55 G -2.15 -.25(ev e)-3.452
H .952(l, insisting on the interchangeability of systems.).25 F(Gi)5.952
E -.15(ve)-.25 G 3.452(nas).15 G .952(et of)-3.452 F .388
(data and an SQL query)126 626.4 R 2.888(,a)-.65 G .688 -.15(ny r)-2.888
H .389(elational system and an).15 F 2.889(yh)-.15 G(ardw)-2.889 E .389
(are should pro)-.1 F .389(vide the same)-.15 F .409(result tables.)126
638.4 R .408(The document community does not \(yet\) insist that querie\
s posed on docu-)5.409 F .539(ments should produce the same result at e\
ach site, and the database community does not)126 650.4 R EP
%%Page: 15 16
%%BeginPageSetup
BP
%%EndPageSetup
/F0 10/Times-Roman@0 SF(15)476 66 Q(\(yet\) insist that there be a comm\
on interchange format for relational data.)126 120 Q .712(Insistence on\
the independence of the data underscores the importance of markup to t\
he)126 135.6 R .698(document community)126 147.6 R 3.198(,a)-.65 G .698
(nd illustrates wh)-3.198 F 3.198(yt)-.05 G .698(he de)-3.198 F -.15(ve)
-.25 G .698(lopment of standards for representing).15 F .24
(syntax has been considered an important task.)126 159.6 R .239
(This can be contrasted with the traditional)5.239 F .48
(database community)126 171.6 R 2.98(,f)-.65 G .48
(or whom it has been unimportant to settle on common formats for)-2.98 F
-.15(ex)126 183.6 S 1.165(changing relational data, since much of this \
data resides in only one location, and is).15 F .016
(constantly being updated in an)126 195.6 R 2.516(yc)-.15 G 2.516
(ase. On)-2.516 F .016(the other hand, the traditional database commu-)
2.516 F .383(nity insists on the independence of their applications fro\
m underlying hardw)126 207.6 R .383(are and soft-)-.1 F -.1(wa)126 219.6
S 1.249(re, and de).1 F -.15(ve)-.25 G 1.249
(loped abstract models that w).15 F 1.249
(ould ensure this independence, because the)-.1 F .384
(applications to be run were e)126 231.6 R(xpensi)-.15 E .683 -.15(ve t)
-.25 H 2.883(od).15 G -2.15 -.25(ev e)-2.883 H .383
(lop and can be more enduring than the data).25 F .685(\(for e)126 243.6
R .685(xample, the application to compute payroll remains \214x)-.15 F
.686(ed, while indi)-.15 F .686(vidual salaries)-.25 F(change\).)126
255.6 Q .348(Generalized markup has played a dominant role in a)126
271.2 R -.1(wa)-.15 G -.1(ke).1 G .348
(ning users to the virtues of data).1 F(interchangeability)126 283.2 Q
5.457(.T)-.65 G .457(here are no)-5.457 F 2.957(ws)-.25 G -2.15 -.25
(ev e)-2.957 H .457(ral standards being de).25 F -.15(ve)-.25 G .457
(loped to layer operational).15 F 2.272
(interchangeability on top of markup.)126 295.2 R 2.271
(It will be important to ensure that operational)7.272 F
(semantics are not dri)126 307.2 Q -.15(ve)-.25 G 2.5(nb).15 G 2.5(yr)
-2.5 G(epresentational concerns.)-2.5 E/F1 10/Times-Bold@0 SF(Display)
126 322.8 Q F0 5.402(.T)C .403(he third area of dif)-5.402 F .403
(ference between te)-.25 F .403(xt and traditional data is in display)
-.15 F 2.903(.T)-.65 G(ra-)-3.253 E .113(ditional database information \
is display-independent; it does not matter signi\214cantly what)126
334.8 R .015
(type of characters are used to print salary information, for e)126
346.8 R 2.516(xample. One)-.15 F .016(might dress up a)2.516 F .012
(report with pie charts and other graphs that illustrate trends more ef)
126 358.8 R(fecti)-.25 E -.15(ve)-.25 G .011(ly than a simple).15 F .229
(table of v)126 370.8 R .229(alues, b)-.25 F .229
(ut these displays are not themselv)-.2 F .23
(es considered to be an essential part of)-.15 F .375(the data.)126
382.8 R .375(Display is much more important to document databases.)5.375
F -.15(Fo)5.375 G 2.875(rm).15 G(an)-2.875 E 2.875(yd)-.15 G(ocuments,)
-2.875 E .711(there is an original printed v)126 394.8 R .712
(ersion whose display is information-bearing \(for scholars at)-.15 F
3.69(least\). Thus,)126 406.8 R 1.19
(some aspects of the original layout of the te)3.69 F 1.19
(xt are important information.)-.15 F(Ev)126 418.8 Q .417
(en if the document ne)-.15 F -.15(ve)-.25 G 2.918(re).15 G .418
(xisted in paper form, ho)-3.068 F(we)-.25 E -.15(ve)-.25 G 1.218 -.4
(r, d).15 H .418(isplay is important because).4 F .213(the end result o\
f searching a document database is the location of a te)126 430.8 R .212
(xt that is to be read,)-.15 F 1.88(and reading is intimately in)126
442.8 R -.2(vo)-.4 G(lv).2 E 1.88(ed with layout.)-.15 F 1.88
(Documents are in f)6.88 F 1.88(act considered by)-.1 F 1.169
(some researchers to be interchangeable with displays; e)126 454.8 R
-.15(ve)-.25 G 1.169(ry display is a form of docu-).15 F(ment, and e)126
466.8 Q -.15(ve)-.25 G(ry document is a form of display[4, 26].).15 E
1.319(Markup, whether presentational or generalized has long been the m\
ethod for installing)126 482.4 R 1.034
(display information in online documents.)126 494.4 R 1.033
(Markup can be used to identify virtually an)6.033 F(y)-.15 E(indi)126
506.4 Q .692(vidual layout, and generalized markup is an ef)-.25 F
(fecti)-.25 E .992 -.15(ve w)-.25 H .693(ay to describe man).05 F 3.193
(yt)-.15 G .693(ypes of)-3.193 F(equi)126 518.4 Q -.25(va)-.25 G .659
(lence classes to parameterize the layout.).25 F .659
(On the other hand, markup')5.659 F 3.159(si)-.55 G(nheritance)-3.159 E
.282(of the update properties of the content interferes with markup')126
530.4 R 2.783(sa)-.55 G .283(bility to display features)-2.783 F 1.014
(that change more rapidly than the update of the content allo)126 542.4
R 3.514(ws. The)-.25 F 1.014(alteration of posi-)3.514 F .677(tions cau\
sed by the insertion of markup complicates the coupling of the display \
to other)126 554.4 R 3.151(processes. Markup')126 566.4 R 3.151(sg)-.55
G .651
(ranularity limits its ability to describe details of an original docu-)
-3.151 F(ment')126 578.4 Q 3.123(sa)-.55 G .623(ppearance that are not \
properties of speci\214c collections of characters \(for e)-3.123 F
(xam-)-.15 E .972(ple, a fold in the page or lacunae in manuscripts\).)
126 590.4 R .972(And if documents are used as inter)5.972 F(-)-.2 E -.1
(fa)126 602.4 S 2.998(ces, the need to couple dynamic processes with th\
e document will con\215ict with).1 F(markup')126 614.4 Q 2.5(ss)-.55 G
(tatic modelling, as described earlier)-2.5 E(.)-.55 E 3.717(Aw)126 630
S 1.217(ord should be said about the relationship between logical and p\
resentational struc-)-3.817 F 2.596(ture. Adv)126 642 R .096
(ocates for descripti)-.2 F .396 -.15(ve m)-.25 H .096(arkup mak).15 F
2.596(eag)-.1 G .096(ood case that it is dif)-2.596 F .096
(\214cult to e)-.25 F .096(xtract log-)-.15 F 1.993
(ical structure from documents that are mark)126 654 R 1.993
(ed up presentationally)-.1 F 4.492(,t)-.65 G 1.992(he main problem)
-4.492 F EP
%%Page: 16 17
%%BeginPageSetup
BP
%%EndPageSetup
/F0 10/Times-Roman@0 SF(16)126 66 Q .153
(being that certain presentational ef)126 120 R .154
(fects are used to denote more than one logical element.)-.25 F(Ho)126
132 Q(we)-.25 E -.15(ve)-.25 G 2.009 -.4(r, i).15 H 3.709(ts).4 G 1.209
(eems too much to conclude, as is usually done, that presentation must \
be)-3.709 F(deri)126 144 Q -.15(ve)-.25 G 3.067(df).15 G .567
(rom logical structure.)-3.067 F .568
(First, there is no one logical structure to a document; the)5.568 F
.623(determination of logical structure must al)126 156 R -.1(wa)-.1 G
.622(ys be made with respect to some underlying).1 F(theory)126 168 Q
3.155(,a)-.65 G .655(nd there is no reason wh)-3.155 F 3.155(yt)-.05 G
.655(his theory must be in accord with a document')-3.155 F 3.155(sp)
-.55 G(re-)-3.155 E 3.126(sentation. Second,)126 180 R .626
(presentation has elements, constraints, and theories of its o)3.126 F
.625(wn, and it)-.25 F .54
(is reasonable for these to be managed in their o)126 192 R .541
(wn domain.)-.25 F -.15(Pa)5.541 G .541(ge layout, for e).15 F .541
(xample, is)-.15 F(not deri)126 204 Q -.25(va)-.25 G
(ble from the logical structures of documents.).25 E .912
(The requirements of document databases e)126 219.6 R .912
(xceed those of traditional databases.)-.15 F(Current)5.912 E .52
(markup practices ha)126 231.6 R .82 -.15(ve l)-.2 H .52
(ed to the recognition of some of these requirements.).15 F .52
(It is impor)5.52 F(-)-.2 E 1.112(tant to note, ho)126 243.6 R(we)-.25 E
-.15(ve)-.25 G 1.912 -.4(r, t).15 H 1.112
(hat none of the requirements logically requires embedded struc-).4 F
4.03(ture. Markup)126 255.6 R 1.53
(is not a necessity for document management systems; rather)4.03 F 4.03
(,i)-.4 G 4.03(ti)-4.03 G 4.03(sc)-4.03 G(om-)-4.03 E .06(monly emplo)
126 267.6 R .06(yed for the con)-.1 F -.15(ve)-.4 G .06(niences we ha)
.15 F .36 -.15(ve c)-.2 H .06(ome to e).15 F .06(xpect and the e)-.15 F
.06(xperience that we)-.15 F(ha)126 279.6 Q 1.121 -.15(ve g)-.2 H .821
(ained with its use.).1 F 2.421 -.8(We s)5.821 H .821(hould be a).8 F
-.1(wa)-.15 G .821(re of its tradeof).1 F .821(fs so that we kno)-.25 F
3.322(ww)-.25 G .822(hen to)-3.322 F
(use it, and when to use other structures.)126 291.6 Q/F1 10
/Times-Bold@0 SF 2.5(7. Discussion.)126 315.6 R F0 .105(Prior to the in\
troduction of relational databases, traditional database systems were u\
sually)126 331.2 R .812(described operationally)126 343.2 R 5.812(.E)
-.65 G .812(ach database system w)-5.812 F .812
(as de\214ned as a data structure and a set)-.1 F 2.181
(of operations on that structure.)126 355.2 R 2.181
(IMS databases, for e)7.181 F 2.181(xample, pro)-.15 F 2.181
(vided a hierarchical)-.15 F 1.037(structure and operations for na)126
367.2 R(vig)-.2 E 1.037(ating, querying and updating that hierarch)-.05
F 4.838 -.65(y. W)-.05 H 1.038(ith the).25 F(adv)126 379.2 Q .087(ent o\
f the relational model, the database community recognized the virtues o\
f de\214ning)-.15 F .833(the or)126 391.2 R -.05(ga)-.18 G .834(nizatio\
n of data in terms of mathematical abstractions, usually in terms of al\
ge-).05 F 2.803(bras. Mathematical)126 403.2 R .303(abstractions ha)
2.803 F .603 -.15(ve t)-.2 H .303(he adv).15 F .303(antage that the)-.25
F 2.802(ya)-.15 G .302(re separate from their rep-)-2.802 F
(resentations, and are susceptible to theoretical in)126 415.2 Q -.15
(ve)-.4 G(stig).15 E(ation.)-.05 E 1.612
(Markup-based document management systems are still lar)126 430.8 R
1.612(gely de\214ned in terms of the)-.18 F .37
(sequential data structure that is considered to be `te)126 442.8 R 2.87
(xt'. Lik)-.15 F 2.87(eI)-.1 G .37(MS databases, the)-2.87 F 2.87(yt)
-.15 G .37(end to)-2.87 F .477(see e)126 454.8 R -.15(ve)-.25 G .477
(ry te).15 F .477(xt structure as a hierarch)-.15 F 1.777 -.65(y, p)-.05
H .477(ossibly de\214ned by a grammar).65 F 5.478(.A)-.55 G 2.978(sar)
-5.478 G .478(esult, these)-2.978 F .984(systems will suf)126 466.8 R
.984
(fer problems similar to those of databases not based on a mathematical)
-.25 F 3.362(model[6]. In)126 478.8 R(particular)3.362 E 3.362(,f)-.4 G
.863(undamental issues of identity and dependenc)-3.362 F 3.363(yw)-.15
G .863(ill continue to)-3.363 F
(be hard to separate from discussions about representations of data.)126
490.8 Q .622(Markup and markup-based systems address a v)126 506.4 R
.622(ariety of issues simultaneously)-.25 F 3.122(,i)-.65 G(ncluding)
-3.122 E 1.852
(data interchange, data modelling, and storage representation.)126 518.4
R(Markup')6.852 E 4.353(sa)-.55 G(dv)-4.353 E 1.853(ocates see)-.2 F
.075(this combination as a strength.)126 530.4 R 1.675 -.8(We s)5.075 H
.075(uggest that the separation of these concerns is impor).8 F(-)-.2 E
.133(tant in the long term for document management systems, just as it \
has been for databases.)126 542.4 R .59
(Markup is not a data model, it is a type of data representation.)126
554.4 R .589(Since the formal proper)5.589 F(-)-.2 E .306(ties of docum\
ent management systems should be based on mathematical models, markup)
126 566.4 R(is unlik)126 578.4 Q(ely to pro)-.1 E(vide a satisf)-.15 E
(actory basis for document management systems.)-.1 E .588(Separating re\
presentational concerns from data modelling concerns may help to clear \
up)126 594 R 2.203(current disputes about the true potential of markup \
standards for document manage-)126 606 R .901(ment[29, 5].)126 618 R
-.15(Pa)5.901 G .901(rt of the problem is that adv).15 F .901
(ocates of markup claim adv)-.2 F .9(antages that are)-.25 F 1.631
(neither e)126 630 R(xclusi)-.15 E 1.931 -.15(ve t)-.25 H 4.132(om).15 G
1.632(arkup nor particularly attendant on its use.)-4.132 F(Descripti)
6.632 E -.15(ve)-.25 G 1.632(ness and).15 F(portability)126 642 Q 4.277
(,f)-.65 G 1.776
(or instance, are not con\214ned to certain types of markup, the)-4.277
F 4.276(ya)-.15 G 1.776(re merely)-4.276 F .773
(properties that intelligent use of markup share with man)126 654 R
3.273(yo)-.15 G .773(ther concei)-3.273 F -.25(va)-.25 G .773
(ble approaches.).25 F EP
%%Page: 17 18
%%BeginPageSetup
BP
%%EndPageSetup
/F0 10/Times-Roman@0 SF(17)476 66 Q 1.876
(Sometimes the actual claims for markup-based systems are o)126 120 R
-.15(ve)-.15 G 1.875(rstated; the claim that).15 F .355
(SGML results in portable documents, for e)126 132 R .356(xample, f)-.15
F .356(alls afoul of the observ)-.1 F .356(ation that it is)-.25 F .743
(possible to put angle brack)126 144 R .742(ets around)-.1 F/F1 10
/Times-Italic@0 SF(tr)3.242 E(of)-.45 E(f)-.18 E F0 .742
(tags, supply a simple document type descrip-)3.242 F(tor)126 156 Q
3.326(,a)-.4 G .826(nd thereby achie)-3.326 F 1.126 -.15(ve a)-.25 H
3.326(nS).15 G .826(GML-compliant document, without g)-3.326 F .826
(aining an)-.05 F 3.326(yp)-.15 G(ortability)-3.326 E .856(or descripti)
126 168 R -.15(ve)-.25 G .856(ness for the information.\207).15 F -.35
(Tr)5.856 G .855(ue portability requires not only that informa-).35 F
.185(tion be transportable from one machine to another)126 180 R 2.686
(,b)-.4 G .186(ut that the semantics of that informa-)-2.886 F .231
(tion be the same on either machine. SGML, in particular)126 192 R 2.731
(,c)-.4 G .23(laims to transfer no semantics,)-2.731 F
(so it surely cannot guarantee portability)126 204 Q(.)-.65 E(Gi)126
219.6 Q -.15(ve)-.25 G 2.996(na).15 G 2.996(nu)-2.996 G .496
(nderstanding of markup and its characteristics, what should we do ne)
-2.996 F 2.997(xt? One)-.15 F .519
(solution is to add a formal structure on top of markup-based systems.)
126 231.6 R .519(Such an approach)5.519 F .094(is tak)126 243.6 R .094
(en by Macleod)-.1 F F1 .094(et al.)2.594 F F0 2.595(,f)C .095(or e)
-2.595 F .095
(xample, in their proposal to layer an applications program)-.15 F
(interf)126 255.6 Q .268(ace on SGML[19].)-.1 F .267
(This reasonable approach has the adv)5.268 F .267(antage of le)-.25 F
-.15(ve)-.25 G .267(raging e).15 F(xist-)-.15 E 1.74
(ing markup-based systems.)126 267.6 R 1.741(From the point of vie)6.741
F 4.241(wo)-.25 G 4.241(fe)-4.241 G 1.741
(stablishing solid foundations,)-4.241 F(ho)126 279.6 Q(we)-.25 E -.15
(ve)-.25 G 2.517 -.4(r, t).15 H 1.717(his approach suf).4 F 1.717
(fers in that it will be pushed to support e)-.25 F 1.716
(xisting standards,)-.15 F
(where the formalism might suggest a departure.)126 291.6 Q 3.456(As)126
307.2 S .956(econd approach is to start with a mathematical abstraction\
for documents and try to)-3.456 F(de)126 319.2 Q -.15(ve)-.25 G .822
(lop a complete document management system top-do).15 F 3.322(wn. In)
-.25 F .821(this approach, it is the)3.322 F 1.468
(abstraction that is most important, representations come later)126
331.2 R 6.468(.T)-.55 G 1.469(his approach does not)-6.468 F(gi)126
343.2 Q 1.11 -.15(ve r)-.25 H .81(esults as quickly as the le).15 F -.15
(ve)-.25 G .81(raged approach, b).15 F .81
(ut it holds more potential for clearly)-.2 F 2.027
(separating the formal issues from the representational ones.)126 355.2
R 2.028(In the second approach,)7.027 F(markup is only one of man)126
367.2 Q 2.5(yp)-.15 G(otential forms of representation)-2.5 E/F2 10
/Times-Bold@0 SF 2.5(8. Ackno)126 391.2 R(wledgements.)-.1 E F0 1.731
(This w)126 406.8 R 1.731(ork w)-.1 F 1.731
(as \214nancially supported by an IBM Canada Research Fello)-.1 F 1.73
(wship, by the)-.25 F 1.535(Information T)126 418.8 R 1.535
(echnology Research Centre of Ontario, and by the Natural Sciences and)
-.7 F 2.737(Engineering Research Council of Canada.)126 430.8 R 4.337
-.8(We w)7.737 H 2.737(ould lik).7 F 5.237(et)-.1 G 5.236(ot)-5.237 G
2.736(hank Ste)-5.236 F 3.036 -.15(ve d)-.25 H 5.236(eR).15 G(ose,)
-5.236 E 3.957(Michael Sperber)126 442.8 R 3.957(g-McQueen, Anne Br)-.18
F -4.165.835 G 3.958(ggemann-Klein, and Robin Co)4.165 F -.15(ve)
-.15 G 6.458(rf).15 G 3.958(or their)-6.458 F
(thoughtful comments on early drafts of this paper)126 454.8 Q(.)-.55 E
.32 LW 198 636.2 126 636.2 DL/F3 8/Times-Roman@0 SF(\207This ar)126 648
Q(gument w)-.144 E(as pro)-.08 E(vided to us by Ste)-.12 E .24 -.12
(ve d)-.2 H 2(eR).12 G(ose.)-2 E EP
%%Page: 18 19
%%BeginPageSetup
BP
%%EndPageSetup
/F0 10/Times-Roman@0 SF(18)126 66 Q/F1 10/Times-Bold@0 SF(Refer)126 120
Q(ences)-.18 E F0 15(1. Da)126 135.6 R .468(vid Barnard, Ron Hayter)-.2
F 2.968(,M)-.4 G .468(aria Karababa, Geor)-2.968 F .468(ge Log)-.18 F
.468(an, and John McF)-.05 F(adden,)-.15 E 1.819
(\231SGML-Based Markup for Literary T)151 147.6 R -.15(ex)-.7 G 1.819
(ts: T).15 F 2.019 -.1(wo P)-.8 H 1.819(roblems and Some Solutions,).1 F
<9a>-.7 E/F2 10/Times-Italic@0 SF(Computer)151 159.6 Q 2.5(sa)-.1 G
(nd the Humanities,)-2.5 E F0(22, pp. 265-276 \(1988\).)2.5 E 15(2. Da)
126 175.2 R 1.748(vid Barnard, Lou Burnard, Jean-Pierre Gaspart, L)-.2 F
1.747(ynne Price, C.M. Sperber)-.55 F(g-)-.18 E .218
(McQueen, and Nino V)151 187.2 R .218
(arile, \231Notes on SGML Solutions to Markup Problems,)-1.11 F 2.719
<9a54>-.7 G(EI)-2.719 E(ML)151 199.2 Q(W18, T)-.74 E -.15(ex)-.7 G 2.5
(tE).15 G(ncoding Initiati)-2.5 E .3 -.15(ve \()-.25 H
(April 16, 1992\).).15 E 15(3. La)126 214.8 R 2.098
(wrence A. Barsalou, \231)-.15 F 2.097(Ad Hoc Cate)-.8 F(gories,)-.15 E
<9a>-.7 E F2 2.097(Memory & Co)4.597 F(gnition,)-.1 E F0 2.097
(11, 3, pp.)4.597 F(211-227 \(1983\).)151 226.8 Q 15(4. Eric)126 242.4 R
.606(A. Bier and Aaron Goodisman, \231Documents as User Interf)3.106 F
(aces,)-.1 E<9a>-.7 E F2(Pr)3.106 E(oceedings)-.45 E .499
(of the International Confer)151 254.4 R .499(ence on Electr)-.37 F .499
(onic Publishing)-.45 F 2.998(,D)-.1 G .498(ocument Manipulation)-2.998
F(and T)151 266.4 Q(ypo)-.74 E(gr)-.1 E(aphy)-.15 E(,)-.55 E F0
(pp. 249-262, Gaithersb)2.5 E(ur)-.2 E(g, Maryland \(September 1990\).)
-.18 E 15(5. P)126 282 R 1.842
(at Byrne, \231SGML is a Data Exchange Standard, Not a Database,)-.15 F
<9a>-.7 E F2(Thir)4.343 E 4.343(dB)-.37 G(ell-)-4.343 E(cor)151 294 Q
1.437(e/BCC Confer)-.37 F 1.437(ence on Electr)-.37 F 1.436
(onic Document Delivery)-.45 F(,)-.55 E F0 -.15(Pa)3.936 G(rsippan).15 E
2.736 -.65(y, N)-.15 H 1.936 -.25(ew J).65 H(erse).25 E(y)-.15 E
(\(October 13-15, 1992\).)151 306 Q 15(6. E.F)126 321.6 R 3.278(.C)-.8 G
(odd,)-3.278 E F2 .778(The Relational Model for Database Mana)3.278 F
-.1(ge)-.1 G .778(ment: V).1 F(er)-1.11 E .778(sion 2,)-.1 F F0
(Addison-)3.278 E -.8(We)151 333.6 S(sle).8 E 1.3 -.65(y, R)-.15 H
(eading, Massachusetts \(1990\).).65 E 15(7. James)126 349.2 R .579
(H. Coombs, Allen H. Renear)3.08 F 3.079(,a)-.4 G .579(nd Ste)-3.079 F
-.15(ve)-.25 G 3.079(nJ).15 G 3.079(.D)-3.079 G .579
(eRose, \231Markup Systems and)-3.079 F .364(the Future of Scholarly T)
151 361.2 R -.15(ex)-.7 G 2.864(tP).15 G(rocessing,)-2.864 E<9a>-.7 E F2
.364(Communications of the A)2.864 F(CM,)-.3 E F0 .365(30, 11, pp.)2.864
F(933-947 \(1987\).)151 373.2 Q 15(8. E.W)126 388.8 R 2.819(.D)-.92 G
.318(ijkstra, \231My Hopes of Computing Science,)-2.819 F<9a>-.7 E F2
(Pr)2.818 E .318(oceedings of the 4th Interna-)-.45 F .787
(tional Confer)151 400.8 R .787(ence on Softwar)-.37 F 3.287(eE)-.37 G
(ngineering)-3.287 E(,)-.1 E F0 .788(Munich, German)3.288 F 3.288(y\()
-.15 G .788(September 17-19,)-3.288 F(1979\).)151 412.8 Q 15
(9. Albertine)126 428.4 R(Gaur)2.91 E(,)-.4 E F2 2.91(AH)2.91 G .41
(istory of Writing \(r)-2.91 F -.15(ev)-.37 G .41(ised edition\),).15 F
F0(Abbe)2.91 E .41(ville Press, Ne)-.25 F 2.91(wY)-.25 G(ork,)-4.01 E
(N.Y)151 440.4 Q 2.5(.\()-1.29 G(1992\).)-2.5 E 10(10. C.F)126 456 R
4.09(.G)-.8 G(oldf)-4.09 E 1.59(arb, \231)-.1 F 4.09(AG)-.8 G 1.59
(eneralized Approach to Document Markup,)-4.09 F<9a>-.7 E F2(Pr)4.09 E
1.59(oceedings of)-.45 F .513(the A)151 468 R .513(CM SIGPLAN/SIGO)-.3 F
3.013(AS)-.55 G .513(ymposium on T)-3.013 F -.2(ex)-.92 G 3.013(tM).2 G
(anipulation,)-3.013 E F0 .512(2, 1 & 2, pp. 68-73,)3.012 F
(Portland, Ore)151 480 Q(gon \(June 8-10, 1981\).)-.15 E 10(11. Nelson)
126 495.6 R(Goodman,)2.5 E F2(Langua)2.5 E -.1(ge)-.1 G 2.5(so).1 G 2.5
(fA)-2.5 G(rt,)-2.5 E F0(Hack)2.5 E(et Publishing Co. \(1976\).)-.1 E 10
(12. Ro)126 511.2 R 4.347(yH)-.1 G(arris,)-4.347 E F2 1.847
(The Origin of Writing)4.347 F(,)-.1 E F0 1.847(Gerald Duckw)4.347 F
1.848(ord & Co., London, England)-.1 F(\(1986\).)151 523.2 Q 10
(13. Eric)126 538.8 R 1.504(A. Ha)4.004 F -.15(ve)-.2 G(lock,).15 E F2
(Pr)4.004 E 1.504(eface to Plato,)-.37 F F0(Harv)4.004 E 1.504(ard Uni)
-.25 F -.15(ve)-.25 G 1.504(rsity Press, Cambridge, Mas-).15 F
(sachusetts \(1963\).)151 550.8 Q 10(14. T)126 566.4 R -.15(ex)-.7 G
2.804(tE).15 G .304(ncoding Initiati)-2.804 F -.15(ve)-.25 G(,).15 E F2
.304(Guidelines for Electr)2.804 F .305(onic T)-.45 F -.2(ex)-.92 G
2.805(tE).2 G .305(ncoding and Inter)-2.805 F -.15(ch)-.37 G(ang).15 E
-.1(e,)-.1 G F0(Chapter 16,)151 578.4 Q F2(Se)2.5 E
(gmentation and Alignment)-.4 E F0 2.5(,C)C
(hicago, Illinois \(January 21, 1993\).)-2.5 E 10(15. W)126 594 R .473
(illiam K)-.4 F(ent,)-.25 E F2 .473
(Data and Reality: Basic Assumptions in Data Pr)2.973 F .473
(ocessing Reconsid-)-.45 F(er)151 606 Q(ed,)-.37 E F0
(North-Holland Publishing Co., Ne)2.5 E 2.5(wY)-.25 G(ork \(1978\).)-3.6
E 10(16. Brian)126 621.6 R 2.177 -.92(W. K)2.837 H .337
(ernighan, \231Issues and T).67 F(radeof)-.35 E .337
(fs in Document Preparation Systems,)-.25 F<9a>-.7 E F2(EP)2.837 E .743
('90, Pr)151 633.6 R .742(oceedings of the International Confer)-.45 F
.742(ence on Electr)-.37 F .742(onic Publishing)-.45 F 3.242(,D)-.1 G
(ocu-)-3.242 E 1.112(ment Manipulation, & T)151 645.6 R(ypo)-.74 E(gr)
-.1 E(aphy)-.15 E(,)-.55 E F0 1.113(pp. 1-16, Gaithersb)3.612 F(ur)-.2 E
1.113(g, Maryland \(September)-.18 F(1990\).)151 657.6 Q EP
%%Page: 19 20
%%BeginPageSetup
BP
%%EndPageSetup
/F0 10/Times-Roman@0 SF(19)476 66 Q 10(17. Chai)126 120 R .455
(Kim, \231Retrie)2.955 F -.25(va)-.25 G 2.955(lL).25 G .454
(anguage of Social Sciences and Natural Sciences: A Statis-)-2.955 F
1.141(tical In)151 132 R -.15(ve)-.4 G(stig).15 E(ation,)-.05 E<9a>-.7 E
/F1 10/Times-Italic@0 SF -.25(Jo)3.641 G 1.141
(urnal of the American Society for Information Science).25 F(,)-.1 E F0
(pp.)3.641 E(3-7, John W)151 144 Q(ilye & Sons, Inc. \(January 1982\).)
-.4 E 10(18. Da)126 159.6 R .48(vid M. Le)-.2 F(vy)-.25 E 2.979<2c99>
-.65 G -.8(To)-2.979 G .479(pics in Document Research,).8 F<9a>-.7 E F1
(Pr)2.979 E .479(oceedings of the A)-.45 F .479(CM Confer)-.3 F(-)-.2 E
3.035(ence on Document Pr)151 171.6 R 3.035(ocessing Systems,)-.45 F F0
3.035(pp. 187-193, Santa Fe, Ne)5.535 F 5.535(wM)-.25 G -.15(ex)-5.535 G
(ico).15 E(\(December 5-9, 1988\).)151 183.6 Q 10(19. Ian)126 199.2 R
.706(A. Macleod, Brent Nordin, Da)3.206 F .706(vid T)-.2 F 3.206(.B)-.74
G .706(arnard, and Doug Hamilton, \231)-3.206 F 3.205(AF)-.8 G(rame-)
-3.205 E -.1(wo)151 211.2 S 1.203(rk for De).1 F -.15(ve)-.25 G 1.204
(loping SGML Applications,).15 F<9a>-.7 E F1(Pr)3.704 E 1.204
(oceedings of Electr)-.45 F 1.204(onic Publishing)-.45 F('92,)151 223.2
Q F0 1.624(pp. 53-63, Cambridge Uni)4.124 F -.15(ve)-.25 G 1.623
(rsity Press, Lausanne, Switzerland \(April 7-10,).15 F(1992\).)151
235.2 Q 10(20. Douglas)126 250.8 R .957
(L. Medin, \231Concepts and Conceptual Structure,)3.457 F<9a>-.7 E F1
.958(American Psyc)3.458 F(holo)-.15 E(gist,)-.1 E F0
(44, 12, pp. 1469-1481 \(December 1989\).)151 262.8 Q 10(21. Gordon)126
278.4 R(Neal, \231TEI Still Stunts Scholarship,)2.5 E<9a>-.7 E F1
(Confer)2.5 E(ence Abstr)-.37 E(acts and Pr)-.15 E -.1(og)-.45 G -.15
(ra).1 G(mme).15 E(for ALLC-A)151 290.4 Q(CH '92,)-.3 E F0
(pp. 186-191, Christ Church, Oxford, England \(April 1992\).)2.5 E 10
(22. Brent)126 306 R .605(Nordin, Da)3.105 F .605(vid T)-.2 F 3.105(.B)
-.74 G .605(arnard, and Ian A. MacLeod, \231)-3.105 F 3.106(AR)-.8 G
-.25(ev)-3.106 G(ie).25 E 3.106(wo)-.25 G 3.106(ft)-3.106 G .606
(he Standard)-3.106 F(Generalized Markup Language,)151 318 Q<9a>-.7 E F1
(Computer)2.5 E 2.5(sa)-.1 G(nd Standar)-2.5 E(ds)-.37 E F0
(\(to appear\).)2.5 E 10(23. Zenon)126 333.6 R 1.84 -.92(W. P)2.5 H
(ylysh).92 E(yn, \231What')-.05 E 2.5(si)-.55 G 2.5(naM)-2.5 G(ind?,)
-2.5 E<9a>-.7 E F1(Synthese)2.5 E(,)-.1 E F0(70, pp. 97-122 \(1987\).)
2.5 E 10(24. V)126 349.2 R 1.215
(incent Quint, Marc Nanard, and Jacques Andr)-.6 F -4.165.835 G
3.714<2c99>4.165 G -1.15 -.8(To w)-3.714 H 1.214(ards Document Engineer)
.7 F(-)-.2 E(ing,)151 361.2 Q<9a>-.7 E F1 .126(EP 90, Pr)2.626 F .126
(oceedings of the International Confer)-.45 F .126(ence on Electr)-.37 F
.126(onic Publishing)-.45 F(,)-.1 E 4.406(Document Manipulation, & T)151
373.2 R(ypo)-.74 E(gr)-.1 E(aphy)-.15 E(,)-.55 E F0 4.406
(pp. 17-29, Gaithersb)6.906 F(ur)-.2 E 4.405(g, Maryland)-.18 F
(\(September 1990\).)151 385.2 Q 10(25. Darrell)126 400.8 R .965
(R. Raymond, \231Reading Source Code,)3.465 F 3.466<9a49>-.7 G .966
(BM Canada Laboratory T)-3.466 F(echnical)-.7 E
(Report TR 74.070, IBM Canada, T)151 412.8 Q
(oronto, Ontario \(October 1991\).)-.8 E 10(26. Darrell)126 428.4 R
1.117(R. Raymond, \231Fle)3.617 F 1.117(xible T)-.15 F -.15(ex)-.7 G
3.616(tD).15 G 1.116(isplay with)-3.616 F F1(Lector)3.616 E F0 -.7<2c9a>
C F1 1.116(IEEE Computer)4.316 F(,)-1.11 E F0 1.116(25, 8)3.616 F
(\(August 1992\).)151 440.4 Q 10(27. Darrell)126 456 R 2.3
(R. Raymond and Frank Wm. T)4.8 F 2.3(ompa, \231)-.8 F 2.3
(Applying Database Dependenc)-.8 F(y)-.15 E 2.087(Theory to Softw)151
468 R 2.086(are Engineering,)-.1 F 4.586<9a43>-.7 G 2.086
(S-92-56, Department of Computer Science,)-4.586 F(Uni)151 480 Q -.15
(ve)-.25 G(rsity of W).15 E(aterloo, W)-.8 E
(aterloo, Ontario \(December)-.8 E 2.5(,1)-.4 G(992\).)-2.5 E 10
(28. Frank)126 495.6 R .095(Wm. T)2.595 F .096
(ompa and Darrell R. Raymond, \231Database Design for a Dynamic Dic-)-.8
F .098(tionary\232 in)151 507.6 R F1(Resear)2.598 E .398 -.15(ch i)-.37
H 2.597(nH).15 G .097(umanities Computing I, P)-2.597 F(aper)-.8 E 2.597
(sf)-.1 G -.45(ro)-2.597 G 2.597(mt).45 G .097(he 1989 A)-2.597 F
(CH-ALLC)-.3 E(Confer)151 519.6 Q(ence)-.37 E(,)-.1 E F0
(ed. Ian Lancashire, Oxford Uni)2.5 E -.15(ve)-.25 G
(rsity Press \(September 1991\).).15 E 10(29. Brian)126 535.2 R -.35(Tr)
5.269 G -.2(av).35 G 2.769(is, \231SGML: It').2 F 5.269(sN)-.55 G 2.769
(ot Just for T)-5.269 F -.15(ex)-.7 G 5.269(tA).15 G -.15(ny)-5.269 G
(more,).15 E<9a>-.7 E F1(: The SGML).35
F(Ne)151 547.2 Q(wsletter)-.15 E F0(\(July 1992\).)2.5 E 10(30. Ben)126
562.8 R 1.311(Zion W)3.811 F 1.311(acholder and Martin G. Abe)-.8 F(gg,)
-.15 E F1 3.811(AP)3.811 G -.37(re)-3.811 G 1.311
(liminary Reconstruction of the).37 F 1.352(Unpublished Dead Sea Scr)151
574.8 R 1.353(olls: The Hebr)-.45 F 1.653 -.15(ew a)-.37 H 1.353(nd Ar)
.15 F 1.353(amaic T)-.15 F -.2(ex)-.92 G 1.353(ts fr).2 F 1.353
(om Cave F)-.45 F(our)-1.05 E(,)-1.11 E F0(Biblical Archaeology Society)
151 586.8 Q 2.5(,W)-.65 G(ashington, D.C. \(1991\).)-3.3 E 10
(31. Xinxin)126 602.4 R -.8(Wa)2.967 G .467(ng and Derick W).8 F .466
(ood, \231T)-.8 F(ab)-.8 E .466(ular Abstraction for T)-.2 F(ab)-.8 E
.466(ular Editing and F)-.2 F(or)-.15 E(-)-.2 E(matting,)151 614.4 Q<9a>
-.7 E F1(Pr)3.061 E .561(oceedings of 3r)-.45 F 3.061(dI)-.37 G .561
(nternational Confer)-3.061 F .561(ence for Y)-.37 F .561
(oung Computer Scien-)-.92 F(tists,)151 626.4 Q F0(p. Tsinghua Uni)2.5 E
-.15(ve)-.25 G(rsity Press, Beijing, China \(to appear 1993\).).15 E 10
(32. W)126 642 R .538(illiam Proctor W)-.4 F .538
(illiams and Craig S. Abbott,)-.4 F F1 .538(An Intr)3.038 F .538
(oduction to Biblio)-.45 F(gr)-.1 E(aphical)-.15 E 1.892(and T)151 654 R
-.2(ex)-.92 G 1.892(tual Studies, 2nd. Ed.,).2 F F0 1.892
(Modern Language Association of America, Ne)4.392 F(w)-.25 E EP
%%Page: 20 21
%%BeginPageSetup
BP
%%EndPageSetup
/F0 10/Times-Roman@0 SF(20)126 66 Q -1.1(Yo)151 120 S(rk, N.Y)1.1 E 2.5
(.\()-1.29 G(1989\).)-2.5 E EP
%%Trailer
end
%%EOF