-
Notifications
You must be signed in to change notification settings - Fork 12
/
Copy pathConstTerm.py
145 lines (108 loc) · 3.54 KB
/
ConstTerm.py
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
109
110
111
112
113
114
115
116
117
118
119
120
121
122
123
124
125
126
127
128
129
130
131
132
133
134
135
136
137
138
139
140
141
142
143
144
145
"""Intern Semantic Web logical constants
We divide RDF/SWeLL terms into the following hierarchy:
Term
Constant
Symbol (i.e. URI, with or without #fragment)
StringLiteral (i.e. unicode character sequence)
IntegerLiteral (not in RDF '98)
XMLLiteral (@@TODO: not implemented)
BNode (i.e. existentially quantified variable)
(also used for things like lists)
Formula (i.e. nested formula; not in RDF '98)
This constant module covers only the constants, i.e.
the objects that can be shared accross stores/formulas/etc.
They are interned, meanwhile:
>>> x=Symbol("http://example/")
>>> y=Symbol("http://example/")
>>> x is y
1
>>> l=StringLiteral("abc")
>>> m=StringLiteral("abc")
>>> l is m
1
String literals are disjoint from symbols:
>>> n=StringLiteral("http://example/")
>>> x is n
0
NOTE: this relies on python2.2-isms, esp
Overriding the __new__ method
in
Unifying types and classes in Python 2.2
Python Version: 2.2bc1
Guido van Rossum
Tue, 09 Jul 2002 13:49:57 GMT
http://www.python.org/2.2/descrintro.html#__new__
"""
__version__ = '$Id$'
__credits__ = """
inspired by the node.py stuff from http://rdflib.net/
"""
class Symbol(str):
"""A symbol, or logical name, in the Semantic Web.
Don't try to use a relative URI reference as a symbol:
>>> bug=Symbol("../foo")
Traceback (most recent call last):
File "<string>", line 1, in ?
File "ConstTerm.py", line 51, in __new__
assert ':' in name, "must be absolute: %s" % name
AssertionError: must be absolute: ../foo
For now, at least, stick to US-ASCII characters in symbols:
>>> bug=Symbol(u"http://example/#D\u00fcrst")
Traceback (most recent call last):
File "<string>", line 1, in ?
File "ConstTerm.py", line 63, in __new__
sym = str.__new__(Symbol, name)
UnicodeError: ASCII encoding error: ordinal not in range(128)
"""
_seen = {}
def __new__(cls, name):
seen = Symbol._seen
try:
return seen[name]
except KeyError:
assert ':' in name, "must be absolute: %s" % name
sym = str.__new__(cls, name)
seen[name] = sym
return sym
class Namespace(object):
"""A collection of symbols with a common prefix
>>> RDF = Namespace('http://www.w3.org/1999/02/22-rdf-syntax-ns#')
>>> RDF['type']
'http://www.w3.org/1999/02/22-rdf-syntax-ns#type'
>>> RDF['type'] is RDF['type']
1
"""
def __init__(self, name):
assert ':' in name, "must be absolute: %s" % name
self._name = name
self._seen = {}
def name(self):
return self._name
def __getitem__(self, lname):
"""get the lname Symbol in this namespace.
lname -- an XML name (limited to URI characters)
Hmm... we keep another hash table of just the names
in this namespace... is this worthwhile?
"""
seen = self._seen
try:
return seen[lname]
except KeyError:
sym = Symbol(self._name + lname)
seen[lname] = sym
return sym
class StringLiteral(unicode):
_seen = {}
def __new__(cls, chars):
seen = StringLiteral._seen
try:
return seen[chars]
except KeyError:
lit = unicode.__new__(cls, chars)
seen[chars] = lit
return lit
def _test():
import doctest, ConstTerm
return doctest.testmod(ConstTerm)
if __name__ == "__main__":
_test()