graffiti 2.1

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
@@ -0,0 +1,77 @@
1
+ ---
2
+ # rdf.yaml
3
+ #
4
+ # Defines essential parts of RDF model of a Samizdat site. Don't touch
5
+ # it unless you know what you're doing.
6
+
7
+ # Namespaces
8
+ #
9
+ ns:
10
+ s: 'http://www.nongnu.org/samizdat/rdf/schema#'
11
+ tag: 'http://www.nongnu.org/samizdat/rdf/tag#'
12
+ items: 'http://www.nongnu.org/samizdat/rdf/items#'
13
+ rdf: 'http://www.w3.org/1999/02/22-rdf-syntax-ns#'
14
+ dc: 'http://purl.org/dc/elements/1.1/'
15
+ dct: 'http://purl.org/dc/terms/'
16
+ ical: 'http://www.w3.org/2002/12/cal#'
17
+
18
+ # Mapping of internal RDF properties to tables and fields. Statements
19
+ # over properties not listed here or in 'subproperty:' section below are
20
+ # reified using standard rdf::subject, rdf::predicate, and rdf::object
21
+ # properties, so at least these three and s::id must be mapped.
22
+ #
23
+ map:
24
+ 's::id': {resource: id}
25
+ 'dc::date': {resource: published_date}
26
+ 'dct::isPartOf': {resource: part_of}
27
+ 's::isPartOfSubProperty': {resource: part_of_subproperty}
28
+ 's::partSequenceNumber': {resource: part_sequence_number}
29
+
30
+ 'rdf::subject': {statement: subject}
31
+ 'rdf::predicate': {statement: predicate}
32
+ 'rdf::object': {statement: object}
33
+
34
+ 's::login': {member: login}
35
+ 's::fullName': {member: full_name}
36
+ 's::email': {member: email}
37
+
38
+ 'dc::title': {message: title}
39
+ 'dc::creator': {message: creator}
40
+ 'dc::format': {message: format}
41
+ 'dc::language': {message: language}
42
+ 's::openForAll': {message: open}
43
+ 's::hidden': {message: hidden}
44
+ 's::locked': {message: locked}
45
+ 's::content': {message: content}
46
+ 's::htmlFull': {message: html_full}
47
+ 's::htmlShort': {message: html_short}
48
+
49
+ 's::rating': {statement: rating}
50
+
51
+ 's::voteProposition': {vote: proposition}
52
+ 's::voteMember': {vote: member}
53
+ 's::voteRating': {vote: rating}
54
+
55
+ # Map of properties into lists of their subproperties. For each property
56
+ # listed here, an additional qualifier field named <field>_subproperty
57
+ # is defined in the same table (as defined under 'map:' above) referring
58
+ # to resource id identifying the subproperty (normally a uriref resource
59
+ # holding uriref of the subproperty). Only one level of subproperty
60
+ # relation is supported, all subsubproperties must be listed directly
61
+ # under root property.
62
+ #
63
+ subproperties:
64
+ 'dct::isPartOf': [ 's::inReplyTo', 'dct::isVersionOf',
65
+ 's::isTranslationOf', 's::subTagOf' ]
66
+
67
+ # Map of transitive RDF properties into tables that hold their
68
+ # transitive closures. The format of the table is as follows: 'resource'
69
+ # field refers to the subject resource id, property field (and qualifier
70
+ # field in case of subproperty) has the same name as in the main table
71
+ # (as defined under 'map:' above) and holds reference to predicate
72
+ # object, and 'distance' field holds the distance from subject to object
73
+ # in the RDF graph.
74
+ #
75
+ transitive_closure:
76
+ 'dct::isPartOf': part
77
+
@@ -0,0 +1,266 @@
1
+ -- Samizdat Database Triggers - PostgreSQL
2
+ --
3
+ -- Copyright (c) 2002-2011 Dmitry Borodaenko <angdraug@debian.org>
4
+ --
5
+ -- This program is free software.
6
+ -- You can distribute/modify this program under the terms of
7
+ -- the GNU General Public License version 3 or later.
8
+ --
9
+
10
+ CREATE FUNCTION insert_resource() RETURNS TRIGGER AS $$
11
+ BEGIN
12
+ IF NEW.id IS NULL THEN
13
+ INSERT INTO resource (literal, uriref, label)
14
+ VALUES ('false', 'false', TG_ARGV[0]);
15
+ NEW.id := currval('resource_id_seq');
16
+ END IF;
17
+ RETURN NEW;
18
+ END;
19
+ $$ LANGUAGE 'plpgsql';
20
+
21
+ CREATE TRIGGER insert_statement BEFORE INSERT ON statement
22
+ FOR EACH ROW EXECUTE PROCEDURE insert_resource('statement');
23
+
24
+ CREATE TRIGGER insert_member BEFORE INSERT ON member
25
+ FOR EACH ROW EXECUTE PROCEDURE insert_resource('member');
26
+
27
+ CREATE TRIGGER insert_message BEFORE INSERT ON message
28
+ FOR EACH ROW EXECUTE PROCEDURE insert_resource('message');
29
+
30
+ CREATE TRIGGER insert_vote BEFORE INSERT ON vote
31
+ FOR EACH ROW EXECUTE PROCEDURE insert_resource('vote');
32
+
33
+ CREATE FUNCTION delete_resource() RETURNS TRIGGER AS $$
34
+ BEGIN
35
+ DELETE FROM resource WHERE id = OLD.id;
36
+ RETURN NULL;
37
+ END;
38
+ $$ LANGUAGE 'plpgsql';
39
+
40
+ CREATE TRIGGER delete_statement AFTER DELETE ON statement
41
+ FOR EACH ROW EXECUTE PROCEDURE delete_resource();
42
+
43
+ CREATE TRIGGER delete_member AFTER DELETE ON member
44
+ FOR EACH ROW EXECUTE PROCEDURE delete_resource();
45
+
46
+ CREATE TRIGGER delete_message AFTER DELETE ON message
47
+ FOR EACH ROW EXECUTE PROCEDURE delete_resource();
48
+
49
+ CREATE TRIGGER delete_vote AFTER DELETE ON vote
50
+ FOR EACH ROW EXECUTE PROCEDURE delete_resource();
51
+
52
+ CREATE FUNCTION select_subproperty(value resource.id%TYPE, subproperty resource.id%TYPE) RETURNS resource.id%TYPE AS $$
53
+ BEGIN
54
+ IF subproperty IS NULL THEN
55
+ RETURN NULL;
56
+ ELSE
57
+ RETURN value;
58
+ END IF;
59
+ END;
60
+ $$ LANGUAGE 'plpgsql';
61
+
62
+ CREATE FUNCTION calculate_statement_rating(statement_id statement.id%TYPE) RETURNS statement.rating%TYPE AS $$
63
+ BEGIN
64
+ RETURN (SELECT AVG(rating) FROM vote WHERE proposition = statement_id);
65
+ END;
66
+ $$ LANGUAGE 'plpgsql';
67
+
68
+ CREATE FUNCTION update_nrelated(tag_id resource.id%TYPE) RETURNS VOID AS $$
69
+ DECLARE
70
+ dc_relation resource.label%TYPE := 'http://purl.org/dc/elements/1.1/relation';
71
+ s_subtag_of resource.label%TYPE := 'http://www.nongnu.org/samizdat/rdf/schema#subTagOf';
72
+ s_subtag_of_id resource.id%TYPE;
73
+ n tag.nrelated%TYPE;
74
+ supertag RECORD;
75
+ BEGIN
76
+ -- update nrelated
77
+ SELECT COUNT(*) INTO n
78
+ FROM statement s
79
+ INNER JOIN resource p ON s.predicate = p.id
80
+ WHERE p.label = dc_relation AND s.object = tag_id AND s.rating > 0;
81
+
82
+ UPDATE tag SET nrelated = n WHERE id = tag_id;
83
+ IF NOT FOUND THEN
84
+ INSERT INTO tag (id, nrelated) VALUES (tag_id, n);
85
+ END IF;
86
+
87
+ -- update nrelated_with_subtags for this tag and its supertags
88
+ SELECT id INTO s_subtag_of_id FROM resource
89
+ WHERE label = s_subtag_of;
90
+
91
+ FOR supertag IN (
92
+ SELECT tag_id AS id, 0 AS distance
93
+ UNION
94
+ SELECT part_of AS id, distance FROM part
95
+ WHERE id = tag_id
96
+ AND part_of_subproperty = s_subtag_of_id
97
+ ORDER BY distance ASC)
98
+ LOOP
99
+ UPDATE tag
100
+ SET nrelated_with_subtags = nrelated + COALESCE((
101
+ SELECT SUM(subt.nrelated)
102
+ FROM part p
103
+ INNER JOIN tag subt ON subt.id = p.id
104
+ WHERE p.part_of = supertag.id
105
+ AND p.part_of_subproperty = s_subtag_of_id), 0)
106
+ WHERE id = supertag.id;
107
+ END LOOP;
108
+ END;
109
+ $$ LANGUAGE 'plpgsql';
110
+
111
+ CREATE FUNCTION update_nrelated_if_subtag(tag_id resource.id%TYPE, property resource.id%TYPE) RETURNS VOID AS $$
112
+ DECLARE
113
+ s_subtag_of resource.label%TYPE := 'http://www.nongnu.org/samizdat/rdf/schema#subTagOf';
114
+ s_subtag_of_id resource.id%TYPE;
115
+ BEGIN
116
+ SELECT id INTO s_subtag_of_id FROM resource
117
+ WHERE label = s_subtag_of;
118
+
119
+ IF property = s_subtag_of_id THEN
120
+ PERFORM update_nrelated(tag_id);
121
+ END IF;
122
+ END;
123
+ $$ LANGUAGE 'plpgsql';
124
+
125
+ CREATE FUNCTION update_rating() RETURNS TRIGGER AS $$
126
+ DECLARE
127
+ dc_relation resource.label%TYPE := 'http://purl.org/dc/elements/1.1/relation';
128
+ old_rating statement.rating%TYPE;
129
+ new_rating statement.rating%TYPE;
130
+ tag_id resource.id%TYPE;
131
+ predicate_uriref resource.label%TYPE;
132
+ BEGIN
133
+ -- save some values for later reference
134
+ SELECT s.rating, s.object, p.label
135
+ INTO old_rating, tag_id, predicate_uriref
136
+ FROM statement s
137
+ INNER JOIN resource p ON s.predicate = p.id
138
+ WHERE s.id = NEW.proposition;
139
+
140
+ -- set new rating of the proposition
141
+ new_rating := calculate_statement_rating(NEW.proposition);
142
+ UPDATE statement SET rating = new_rating WHERE id = NEW.proposition;
143
+
144
+ -- check if new rating reverts truth value of the proposition
145
+ IF predicate_uriref = dc_relation
146
+ AND (((old_rating IS NULL OR old_rating <= 0) AND new_rating > 0) OR
147
+ (old_rating > 0 AND new_rating <= 0))
148
+ THEN
149
+ PERFORM update_nrelated(tag_id);
150
+ END IF;
151
+
152
+ RETURN NEW;
153
+ END;
154
+ $$ LANGUAGE 'plpgsql';
155
+
156
+ CREATE TRIGGER update_rating AFTER INSERT OR UPDATE OR DELETE ON vote
157
+ FOR EACH ROW EXECUTE PROCEDURE update_rating();
158
+
159
+ CREATE FUNCTION before_update_part() RETURNS TRIGGER AS $$
160
+ BEGIN
161
+ IF TG_OP = 'INSERT' THEN
162
+ IF NEW.part_of IS NULL THEN
163
+ RETURN NEW;
164
+ END IF;
165
+ ELSIF TG_OP = 'UPDATE' THEN
166
+ IF (NEW.part_of IS NULL AND OLD.part_of IS NULL) OR
167
+ ((NEW.part_of = OLD.part_of) AND (NEW.part_of_subproperty = OLD.part_of_subproperty))
168
+ THEN
169
+ -- part_of is unchanged, do nothing
170
+ RETURN NEW;
171
+ END IF;
172
+ END IF;
173
+
174
+ -- check for loops
175
+ IF NEW.part_of = NEW.id OR NEW.part_of IN (
176
+ SELECT id FROM part WHERE part_of = NEW.id)
177
+ THEN
178
+ -- unset part_of, but don't fail whole query
179
+ NEW.part_of = NULL;
180
+ NEW.part_of_subproperty = NULL;
181
+
182
+ IF TG_OP != 'INSERT' THEN
183
+ -- check it was a subtag link
184
+ PERFORM update_nrelated_if_subtag(OLD.id, OLD.part_of_subproperty);
185
+ END IF;
186
+
187
+ RETURN NEW;
188
+ END IF;
189
+
190
+ RETURN NEW;
191
+ END;
192
+ $$ LANGUAGE 'plpgsql';
193
+
194
+ CREATE TRIGGER before_update_part BEFORE INSERT OR UPDATE ON resource
195
+ FOR EACH ROW EXECUTE PROCEDURE before_update_part();
196
+
197
+ CREATE FUNCTION after_update_part() RETURNS TRIGGER AS $$
198
+ BEGIN
199
+ IF TG_OP = 'INSERT' THEN
200
+ IF NEW.part_of IS NULL THEN
201
+ RETURN NEW;
202
+ END IF;
203
+ ELSIF TG_OP = 'UPDATE' THEN
204
+ IF (NEW.part_of IS NULL AND OLD.part_of IS NULL) OR
205
+ ((NEW.part_of = OLD.part_of) AND (NEW.part_of_subproperty = OLD.part_of_subproperty))
206
+ THEN
207
+ -- part_of is unchanged, do nothing
208
+ RETURN NEW;
209
+ END IF;
210
+ END IF;
211
+
212
+ IF TG_OP != 'INSERT' THEN
213
+ IF OLD.part_of IS NOT NULL THEN
214
+ -- clean up links generated for old part_of
215
+ DELETE FROM part
216
+ WHERE id IN (
217
+ -- for old resource...
218
+ SELECT OLD.id
219
+ UNION
220
+ --...and all its parts, ...
221
+ SELECT id FROM part WHERE part_of = OLD.id)
222
+ AND part_of IN (
223
+ -- ...remove links to all parents of old resource
224
+ SELECT part_of FROM part WHERE id = OLD.id)
225
+ AND part_of_subproperty = OLD.part_of_subproperty;
226
+ END IF;
227
+ END IF;
228
+
229
+ IF TG_OP != 'DELETE' THEN
230
+ IF NEW.part_of IS NOT NULL THEN
231
+ -- generate links to the parent and grand-parents of new resource
232
+ INSERT INTO part (id, part_of, part_of_subproperty, distance)
233
+ SELECT NEW.id, NEW.part_of, NEW.part_of_subproperty, 1
234
+ UNION
235
+ SELECT NEW.id, part_of, NEW.part_of_subproperty, distance + 1
236
+ FROM part
237
+ WHERE id = NEW.part_of
238
+ AND part_of_subproperty = NEW.part_of_subproperty;
239
+
240
+ -- generate links from all parts of new resource to all its parents
241
+ INSERT INTO part (id, part_of, part_of_subproperty, distance)
242
+ SELECT child.id, parent.part_of, NEW.part_of_subproperty,
243
+ child.distance + parent.distance
244
+ FROM part child
245
+ INNER JOIN part parent
246
+ ON parent.id = NEW.id
247
+ AND parent.part_of_subproperty = NEW.part_of_subproperty
248
+ WHERE child.part_of = NEW.id
249
+ AND child.part_of_subproperty = NEW.part_of_subproperty;
250
+ END IF;
251
+ END IF;
252
+
253
+ -- check if subtag link was affected
254
+ IF TG_OP != 'DELETE' THEN
255
+ PERFORM update_nrelated_if_subtag(NEW.id, NEW.part_of_subproperty);
256
+ END IF;
257
+ IF TG_OP != 'INSERT' THEN
258
+ PERFORM update_nrelated_if_subtag(OLD.id, OLD.part_of_subproperty);
259
+ END IF;
260
+
261
+ RETURN NEW;
262
+ END;
263
+ $$ LANGUAGE 'plpgsql';
264
+
265
+ CREATE TRIGGER after_update_part AFTER INSERT OR UPDATE OR DELETE ON resource
266
+ FOR EACH ROW EXECUTE PROCEDURE after_update_part();
@@ -0,0 +1,462 @@
1
+ \documentclass{llncs}
2
+ \usepackage{makeidx} % allows for indexgeneration
3
+ \usepackage[pdfpagescrop={92 112 523 778},a4paper=false,
4
+ pdfborder={0 0 0}]{hyperref}
5
+ \emergencystretch=8pt
6
+ %
7
+ \begin{document}
8
+ \mainmatter % start of the contributions
9
+ %
10
+ \title{Model for Collaborative Decision Making Based on RDF Reification}
11
+ \toctitle{Model for Collaborative Decision Making Based on RDF Reification}
12
+ \titlerunning{Collaboration and RDF Reification}
13
+ %
14
+ \author{Dmitry Borodaenko}
15
+ \authorrunning{Dmitry Borodaenko} % abbreviated author list (for running head)
16
+ %%%% modified list of authors for the TOC (add the affiliations)
17
+ \tocauthor{Dmitry Borodaenko}
18
+ %
19
+ \institute{\email{angdraug@debian.org}}
20
+
21
+ \maketitle % typeset the title of the contribution
22
+
23
+ \begin{abstract}
24
+ This paper presents a novel approach to online collaboration on the Web,
25
+ intended as technical means to make collective decisions in situations when
26
+ consensus fails. It is proposed that participants of the process are allowed
27
+ to create statements about site resources and, by the means of RDF
28
+ reification, to assert personal approval of such statements. Arbitrary
29
+ algorithms may then be used to determine validity of a statement in a given
30
+ context from the set of approval statements by different participants. The
31
+ paper goes on to discuss applicability of the proposed approach in the areas
32
+ of open-source development and independent media, and describes its
33
+ implementation in the Samizdat open publishing and collaboration system.
34
+ \end{abstract}
35
+
36
+
37
+ \section{Introduction}
38
+
39
+ Extensive growth of Internet over the last decades introduced a new form of
40
+ human collaboration: online communities. Availability of cheap digital
41
+ communication media has made it possible to form large distributed projects,
42
+ bringing together participants who would be otherwise unable to cooperate.
43
+
44
+ As more and more projects go online and spread across the globe, it becomes
45
+ apparent that new opportunities in remote cooperation also bring forth new
46
+ challenges. As observed by Steven Talbott\cite{fdnc}, technogical means do not
47
+ provide a full substitute for a real person-to-person relations, ``technology
48
+ is not a community''. A well-known example of this is the fact that it is
49
+ vital for an online communty to augment indirect and impersonal digital
50
+ communications with live meetings. However, even regular live meetings do not
51
+ solve all of the remote cooperation problems as they are limited in time and
52
+ scope, and thus can't happen often enough nor include all of the interested
53
+ parties into communication. In particular, one of the problems of online
54
+ communities that is begging for a new and better technical solution is
55
+ decision making and dispute resolution.
56
+
57
+ While it is most common that online communities are formed by volunteers,
58
+ their forms of governance are not necessarily democratic and vary widely, from
59
+ primitive single-person leadership and meritocracy in less formal technical
60
+ projects to consensus and majority voting in more complicated situations.
61
+
62
+ Usually, decision making in online volunteer projects is carried out via
63
+ traditional communication means, such as IRC channels, mailing lists,
64
+ newsgroups, etc., with rare exceptions such as the Debian project which
65
+ employs its own Devotee voting system based on PGP authentication and Concorde
66
+ vote counting\cite{debian-constitution}, and the Wikipedia project which
67
+ relies on a Wiki collaborative publishing system and enforces consensus among
68
+ its contributors. The scale and the level of quality achieved by the latter
69
+ two projects demonstrates that formalized collaboration process is as
70
+ important for volunteer projects as elsewhere: while sufficient to determine
71
+ rough consensus, traditional communications require participants to come up
72
+ with informal means of dispute resolution, making the whole process overly
73
+ dependent on interpersonal attitudes and communicative skills within group.
74
+
75
+ It is not to say that Debian or Wikipedia processes are perfect and need not
76
+ be improved. The strict consensus required by the Wikipedia Editors Policy
77
+ discourages dissenting minority from participation, while full-scale voting
78
+ system like Debian Devotee can't be used for every minor day-to-day decision
79
+ because of the high overhead involved and the limits imposed by the ballot
80
+ form.
81
+
82
+ This paper describes how RDF statement approval based on reification can be
83
+ applied to the problem of online decision making in diverse and politically
84
+ intensive distributed projects, and proposes a generic semantic model which
85
+ can be used in a wide range of applications involving online collaboration.
86
+ The proposed model is implemented in the Samizdat open-publishing and
87
+ collaboration engine, described later in the paper.
88
+
89
+
90
+ \section{Collaboration Model}
91
+
92
+ The collaboration model implemented by Samizdat evolves around the concept of
93
+ \emph{open editing}\cite{opened}, which includes the processes of publishing,
94
+ structuring, and filtering online content. ``Open'' part of open editing
95
+ implies that the collaboration process is visible to all participants, and
96
+ roles of readers and editors are available equally to everyone.
97
+ \emph{Publishing} involves posting new documents, comments, and revised
98
+ documents. \emph{Structuring} involves categorization and appraisal of
99
+ publications and other actions of fellow participants. \emph{Filtering}
100
+ process is intended to reduce information flow to a comprehensible level by
101
+ presenting a user with resources of highest quality and relevance. Each of
102
+ these processes requires a fair amount of decision making to be done, which
103
+ means that its effectiveness can be greatly improved by automating some
104
+ aspects of the decision making procedure.
105
+
106
+
107
+ \section{Collective Statement Approval}
108
+ %
109
+ \subsection{Focus-Centered Site Structure}
110
+
111
+ In the proposed collaboration model, RDF statements are used as a generic
112
+ mechanism for structuring site content. While it is possible to make any kinds
113
+ of statements about site resources, the most important kind of statement is
114
+ the one that relates a resource to a so-called ``focus''\cite{concepts}.
115
+ \emph{Focus} is a kind of resource that, when related by an RDF statement to
116
+ other resources, allows to group similar resources together and to evaluate
117
+ resources against different criteria. In some sense, all activities of project
118
+ members are represented as relations between resources and focuses.
119
+
120
+ Dynamically grouping resources around different focuses allows project members
121
+ to concentrate on the resources that are most relevant to their area of
122
+ interests and provide best quality. Use of RDF for site structure description
123
+ makes it possible to store and exchange filters for site resource selection in
124
+ the form of RDF queries, thus allowing participants to share their preferences
125
+ and ensuring interoperability with RDF-aware agents.
126
+
127
+ Since any resource can be used as a focus, it is possible that project members
128
+ define their own focuses, and relate focuses one to another. In a sufficiently
129
+ large and intensive project, this feature should help site structure to evolve
130
+ in accordance with usage patterns of different groups of users.
131
+
132
+ \subsection{RDF Reification}
133
+
134
+ RDF reification provides a mechanism for describing RDF statements. As defined
135
+ in ``RDF Semantics''\cite{rdf-mt}, assertion of reification of RDF statement
136
+ means that a document exists containing a triple token instantiating the
137
+ statement. The reified triple is a resource which can be described in the same
138
+ way as any other resource. It is important to note that there can be several
139
+ triple tokens with the same subject, object, and predicate, and, according to
140
+ RDF reification semantics, such tokens should be treated as separate
141
+ resources, possibly with different composition or provenance information
142
+ attached to each.
143
+
144
+ \subsection{Proposition and Vote}
145
+
146
+ In the proposed model, all statements are reified, and may be voted upon by
147
+ project members. To distinguish statements with attached votes, they are
148
+ called ``propositions''. \emph{Proposition} is a subclass of RDF statement
149
+ which can be approved or disapproved by votes of project members. Accordingly,
150
+ \emph{vote} is a record of vote cast in favor or against particular
151
+ proposition by particular member, and \emph{rating} is a denotation of
152
+ approval of the proposition as determined from individual votes.
153
+
154
+ Exact mechanism of rating calculation can be determined by each site, or even
155
+ each user, individually, according to average value of votes cast, level of
156
+ trust existing between the user and particular voters, absolute number of
157
+ votes cast, etc. Since individual votes are recorded in RDF and are available
158
+ for later extraction, rating can be calculated at any time using any formula
159
+ that suits the end user best. Some users may choose to share their view of the
160
+ site resources, and publish their filters in the form of RDF queries.
161
+
162
+ Default rating system in Samizdat lets voter select from ratings ``$-2$''
163
+ (no), ``$-1$'' (not likely), ``$0$'' (uncertain), ``$1$'' (likely), ``$2$''
164
+ (yes). Total rating of proposition is equal to the average value of all votes
165
+ cast for the proposition; resources with rating below ``$-1$'' are hidden from
166
+ view.
167
+
168
+
169
+ \section{Target Applications and Use Cases}
170
+ %
171
+ \subsection{Open Publishing}
172
+
173
+ While it is vital for any project to come up with fair and predictable methods
174
+ of decision making, it's hard to find a more typical example than the
175
+ Indymedia network, international open publishing project with the aim of
176
+ providing the public with unbiased news source\cite{openpub}. Since the main
177
+ focus of Indymedia is politics, and since it is explicitly open for everyone,
178
+ independent media centers are used by people from all parts of political
179
+ spectrum, and often become a place of heated debate, or even target of flood
180
+ attacks.
181
+
182
+ This conflict between fairness and political bias, as well as sheer amount of
183
+ information flowing through the news network, creates a need for a more
184
+ flexible categorization and filtering system that would take the burden and
185
+ responsibility of moderation off from site administrators. The issue of
186
+ developing an open editing system was raised by Indymedia project participants
187
+ in January 2002, but, to date, implementations of this concept are not ready
188
+ for production use. The Active2 project\cite{active2} which has set forth to
189
+ fulfil that role is still in the alpha stage of the development, and, unlike
190
+ Samizdat, limits its use of RDF to describing its resources with Dublin Core
191
+ meta-data.
192
+
193
+ Implementation of an open editing system was one of the initial goals of the
194
+ Samizdat project\cite{oscom3}, and deployment of the Samizdat engine by an
195
+ independent media center would become a deciding trial of vitality of the
196
+ proposed collaboration model in a real-world environment.
197
+
198
+ \subsection{Documentation Development}
199
+
200
+ Complexity level of modern computer systems makes it impossible to develop and
201
+ operate them without extensive user and developer manuals which document
202
+ intended behaviour of a system and describe solutions to typical user
203
+ problems. Ultimately, such manuals reflect collective knowledge about a
204
+ system, and may require input from many different people with different
205
+ perspectives. On the other hand, in order to be useful to different people,
206
+ documentation should be well-structured and easy to navigate.
207
+
208
+ The most popular solution for collaborative documentation development to date
209
+ is \emph{Wiki}, a combination of very simple hypertext markup and ability to
210
+ edit documents within an HTML form. Such simplicity makes Wiki easy to use,
211
+ but in the same time limits its applicability to large bodies of
212
+ documentation. Due to being limited to basic hypertext without categorization
213
+ and filtering capabilities, Wiki sites require huge amount of manual editing
214
+ done by trusted maintainers in order to keep the site structure from falling
215
+ behind a growing amount of available information, and to protect it from
216
+ vandals. Although there are successful examples of large Wiki sites (most
217
+ prominent being the Wikipedia project), Wiki does not provide sufficient
218
+ infrastructure for development and maintainance of complex technical
219
+ documentation.
220
+
221
+ Combination of the Wiki approach with RDF metadata, along with implementation
222
+ of the proposed collaborative decision making model for determination of
223
+ documentation structure, would allow to make significant progress in the
224
+ adoption of the open-source software which is often suffering from a lack of
225
+ comprehensive and up-to-date documentation.
226
+
227
+ \subsection{Bug Tracking}
228
+
229
+ Bug-tracking tools have grown to become essential component of any software
230
+ development process. However, despite wide adoption, bug-tracking software has
231
+ not yet reached maturity: interoperability between different tools is missing;
232
+ incompatible issue classifications and work flows complicate status
233
+ syncronization between companies collaborating on a single project; lack of
234
+ integration with time-management, document management, version control and
235
+ other kinds of applications increases amount of routine work done by project
236
+ manager.
237
+
238
+ On the other hand, development of integrated project management systems shows
239
+ that the most important problem in project management automation is
240
+ convergence of information from all sources in a single focal point. For such
241
+ convergence to become possible, unified process flow model, based on open
242
+ standards such as RDF, should be adopted across all information sources, from
243
+ source code version control to developer forums. Since strict provenance
244
+ tracking is a key requirement for such model, the proposed reification-based
245
+ approach may be employed to satisfy it.
246
+
247
+
248
+ \section{Samizdat Engine}
249
+ %
250
+ \subsection{Project Status}
251
+
252
+ Samizdat engine is implemented in the Ruby programming language and relies on
253
+ the PostgreSQL database management system for RDF storage. Other programs
254
+ required for Samizdat deployment are Ruby/Postgres, Ruby/DBI, and YAML4R
255
+ libraries for Ruby, and Apache web server with mod\_ruby module. Samizdat is
256
+ free software and does not require any non-free software to
257
+ run\cite{impl-report}.
258
+
259
+ Samizdat project development started in December 2002, first public release
260
+ was announced in June 2003. As of the second beta version 0.5.1, released in
261
+ March 2004, Samizdat provided basic set of open publishing functionality,
262
+ including registering site members, publishing and replying to messages,
263
+ uploading multimedia messages, voting on relation of site focuses to
264
+ resources, creating and managing new focuses, hand-editing or using GUI for
265
+ constructing and publishing Squish queries that can be used to search and
266
+ filter site resources. Next major release 0.6.0 is expected to add
267
+ collaborative documentation development functionality.
268
+
269
+ \subsection{Samizdat Schema}
270
+
271
+ Core representation of Samizdat content is RDF. Any new resource published on
272
+ Samizdat site is automatically assigned a unique numberic ID, which, when
273
+ appended to the base site URL, forms resource URIref. This ID may be accessed
274
+ via {\tt id} property. Publication time stamp is recorded in {\tt dc:date}
275
+ property (here and below, ``{\tt dc:}'' prefix refers to the Dublin Core
276
+ namespace):
277
+
278
+ \begin{verbatim}
279
+ :id
280
+ rdfs:domain rdfs:Resource .
281
+
282
+ dc:date
283
+ rdfs:domain rdfs:Resource .
284
+ \end{verbatim}
285
+
286
+ {\tt Member} is a registered user of a Samizdat site (synonyms: poster,
287
+ visitor, reader, author, creator). Members can post messages, create focuses,
288
+ relate messages to focuses, vote on relations, view messages, use and publish
289
+ filters based on relations between messages and focuses.
290
+
291
+ \begin{verbatim}
292
+ :Member
293
+ rdfs:subClassOf rdfs:Resource .
294
+
295
+ :login
296
+ rdfs:domain :Member ;
297
+ rdfs:range rdfs:Literal .
298
+ \end{verbatim}
299
+
300
+ Resources are related to focuses with {\tt dc:relation} property:
301
+
302
+ \begin{verbatim}
303
+ :Focus
304
+ rdfs:subClassOf rdfs:Resource .
305
+
306
+ dc:relation
307
+ rdfs:domain rdfs:Resource ;
308
+ rdfs:range :Focus .
309
+ \end{verbatim}
310
+
311
+ {\tt Proposition} is an RDF statement with {\tt rating} property. Value of
312
+ {\tt rating} is calculated from {\tt voteRating} values of individual {\tt
313
+ Vote} resources attached to this proposition via {\tt voteProposition}
314
+ property:
315
+
316
+ \begin{verbatim}
317
+ :Proposition
318
+ rdfs:subClassOf rdf:Statement .
319
+
320
+ :rating
321
+ rdfs:domain :Proposition ;
322
+ rdfs:range rdfs:Literal .
323
+
324
+ :Vote
325
+ rdfs:subClassOf rdfs:Resource .
326
+
327
+ :voteProposition
328
+ rdfs:domain :Vote ;
329
+ rdfs:range :Proposition .
330
+
331
+ :voteMember
332
+ rdfs:domain :Vote ;
333
+ rdfs:range :Member .
334
+
335
+ :voteRating
336
+ rdfs:domain :Vote ;
337
+ rdfs:range rdfs:Literal .
338
+ \end{verbatim}
339
+
340
+ Parts of Samizdat schema that are not relevant to the discussed collective
341
+ decision making model, such as discussion threads, version control, and
342
+ aggregate messages, were omitted. Full Samizdat schema in N3 notation can be
343
+ found in Samizdat source code package.
344
+
345
+ \subsection{RDF Storage Implementation}
346
+
347
+ To address scalability concerns, Samizdat extends traditional relational
348
+ representation of RDF as a table of \{subject, object, predicate\} triples
349
+ with a unique RDF-to-relational query translation technology. Most highly used
350
+ RDF properties of Samizdat schema are mapped into fields of \emph{internal
351
+ resource tables} corresponding to resource classes, with id of the record
352
+ referencing to the {\tt Resource} table; all other properties are recorded as
353
+ triples in the {\tt Statement} table. Detailed explanation of the
354
+ RDF-to-relational mapping can be found in ``Samizdat RDF
355
+ Storage''\cite{rdf-storage} document.
356
+
357
+ To demonstrate usage of the Samizdat RDF schema described earlier in this
358
+ section, the exerpt of Ruby code responsible for individual vote rating
359
+ assignment is quoted below.
360
+
361
+ \begin{verbatim}
362
+ def rating=(value)
363
+ value = Focus.validate_rating(value)
364
+ if value then
365
+ rdf.assert %{
366
+ UPDATE ?rating = '#{value}'
367
+ WHERE (rdf::subject ?stmt #{resource.id})
368
+ (rdf::predicate ?stmt dc::relation)
369
+ (rdf::object ?stmt #{@id})
370
+ (s::voteProposition ?vote ?stmt)
371
+ (s::voteMember ?vote #{session.id})
372
+ (s::voteRating ?vote ?rating)
373
+ USING PRESET NS}
374
+ @rating = nil # invalidate rating cache
375
+ end
376
+ end
377
+ \end{verbatim}
378
+
379
+ In this attribute assignment method of {\tt Focus} class, RDF assertion is
380
+ recorded in extended Squish syntax and populated with variables storing the
381
+ rating {\tt value}, resource identifier {\tt resource.id}, focus identifier
382
+ {\tt @id}, and identifier of registered member {\tt session.id}. When the
383
+ Samizdat RDF storage layer updates {\tt Vote.voteRating}, average value of
384
+ corresponding {\tt Proposition.rating} is recalculated by a stored procedure.
385
+
386
+
387
+ \section{Conclusions}
388
+
389
+ Initially started as an RDF-based open-publishing engine, Samizdat project
390
+ opens a new approach to online collaboration in general. Proposed model of
391
+ collective statement approval via RDF reification is applicable in a large
392
+ range of problem domains, including documentation development and bug
393
+ tracking.
394
+
395
+ Implementation of the proposed model in the Samizdat engine proves viability
396
+ of RDF not only as a metadata interchange format, but also as a data model
397
+ that may be employed by software architects in innovative ways. Key role
398
+ played by RDF reification in the described model shows that this comparatively
399
+ obscure part of RDF standard deserves broader mindshare among Semantic Web
400
+ developers.
401
+
402
+
403
+ % ---- Bibliography ----
404
+ %
405
+ \begin{thebibliography}{19}
406
+ %
407
+ \bibitem {openpub}
408
+ Arnison, Matthew:
409
+ Open publishing is the same as free software, 2002\\
410
+ http://www.cat.org.au/maffew/cat/openpub.html
411
+
412
+ \bibitem {concepts}
413
+ Borodaenko, Dmitry:
414
+ Samizdat Concepts, December 2002\\
415
+ http://savannah.nongnu.org/cgi-bin/viewcvs/samizdat/samizdat/doc/\\
416
+ concepts.txt
417
+
418
+ \bibitem {rdf-storage}
419
+ Borodaenko, Dmitry:
420
+ Samizdat RDF Storage, December 2002\\
421
+ http://savannah.nongnu.org/cgi-bin/viewcvs/samizdat/samizdat/doc/\\
422
+ rdf-storage.txt
423
+
424
+ \bibitem {oscom3}
425
+ Borodaenko, Dmitry:
426
+ Samizdat --- RDF model for an open publishing and cooperation engine. Third
427
+ International OSCOM Conference, Berkman Center for Internet and Society,
428
+ Harvard Law School, May 2003\\
429
+ http://slideml.bitflux.ch/files/slidesets/503/title.html
430
+
431
+ \bibitem {impl-report}
432
+ Borodaenko, Dmitry:
433
+ Samizdat RDF Implementation Report, September 2003\\
434
+ http://lists.w3.org/Archives/Public/www-rdf-interest/2003Sep/0043.html
435
+
436
+ \bibitem {debian-constitution}
437
+ Debian Constitution. Debian Project, 1999\\
438
+ http://www.debian.org/devel/constitution
439
+
440
+ \bibitem {rdf-mt}
441
+ Hayes, Patrick:
442
+ RDF Semantics. W3C, February 2004\\
443
+ http://www.w3.org/TR/rdf-mt
444
+
445
+ \bibitem {opened}
446
+ Jay, Dru:
447
+ Three Proposals for Open Publishing --- Towards a transparent, collaborative
448
+ editorial framework, 2002\\
449
+ http://dru.ca/imc/open\_pub.html
450
+
451
+ \bibitem {fdnc}
452
+ Talbott, Stephen L.:
453
+ The Future Does Not Compute. O'Reilly \& Associates, 1995\\
454
+ http://www.oreilly.com/\homedir{}stevet/fdnc/
455
+
456
+ \bibitem {active2}
457
+ Warren, Mike:
458
+ Active2 Design. Indymedia, 2002.\\
459
+ http://docs.indymedia.org/view/Devel/DesignDocument
460
+
461
+ \end{thebibliography}
462
+ \end{document}