本文整理汇总了Python中whoosh.compat.u函数的典型用法代码示例。如果您正苦于以下问题:Python u函数的具体用法?Python u怎么用?Python u使用的例子?那么恭喜您, 这里精选的函数代码示例或许可以为您提供帮助。
在下文中一共展示了u函数的20个代码示例,这些例子默认根据受欢迎程度排序。您可以为喜欢或者感觉有用的代码点赞,您的评价将有助于我们的系统推荐出更棒的Python代码示例。
示例1: test_phrase_andmaybe
def test_phrase_andmaybe():
qp = default.QueryParser("f", None)
q = qp.parse(u('Dahmen ANDMAYBE "Besov Spaces"'))
assert isinstance(q, query.AndMaybe)
assert q[0] == query.Term("f", u("Dahmen"))
assert q[1] == query.Phrase("f", [u("Besov"), u("Spaces")])
开发者ID:gsadikin,项目名称:whoosh,代码行数:7,代码来源:test_parsing.py
示例2: test_deleteall
def test_deleteall():
schema = fields.Schema(text=fields.TEXT)
with TempIndex(schema, "deleteall") as ix:
w = ix.writer()
domain = u("alfa bravo charlie delta echo").split()
for i, ls in enumerate(permutations(domain)):
w.add_document(text=u(" ").join(ls))
if not i % 10:
w.commit()
w = ix.writer()
w.commit()
# This is just a test, don't use this method to delete all docs IRL!
doccount = ix.doc_count_all()
w = ix.writer()
for docnum in xrange(doccount):
w.delete_document(docnum)
w.commit()
with ix.searcher() as s:
r = s.search(query.Or([query.Term("text", u("alfa")),
query.Term("text", u("bravo"))]))
assert len(r) == 0
ix.optimize()
assert ix.doc_count_all() == 0
with ix.reader() as r:
assert list(r) == []
开发者ID:pombredanne,项目名称:whoosh,代码行数:29,代码来源:test_indexing.py
示例3: __unicode__
def __unicode__(self):
r = u("(")
r += (self.JOINT).join([text_type(s) for s in self.subqueries])
r += u(")")
if self.minmatch:
r += u(">%s") % self.minmatch
return r
开发者ID:Apophus,项目名称:microblog,代码行数:7,代码来源:compound.py
示例4: test_boolean
def test_boolean():
schema = fields.Schema(id=fields.ID(stored=True),
done=fields.BOOLEAN(stored=True))
ix = RamStorage().create_index(schema)
w = ix.writer()
w.add_document(id=u("a"), done=True)
w.add_document(id=u("b"), done=False)
w.add_document(id=u("c"), done=True)
w.add_document(id=u("d"), done=False)
w.add_document(id=u("e"), done=True)
w.commit()
with ix.searcher() as s:
qp = qparser.QueryParser("id", schema)
r = s.search(qp.parse("done:true"))
assert sorted([d["id"] for d in r]) == ["a", "c", "e"]
assert all(d["done"] for d in r)
r = s.search(qp.parse("done:yes"))
assert sorted([d["id"] for d in r]) == ["a", "c", "e"]
assert all(d["done"] for d in r)
q = qp.parse("done:false")
assert q.__class__ == query.Term
assert q.text is False
assert schema["done"].to_bytes(False) == b("f")
r = s.search(q)
assert sorted([d["id"] for d in r]) == ["b", "d"]
assert not any(d["done"] for d in r)
r = s.search(qp.parse("done:no"))
assert sorted([d["id"] for d in r]) == ["b", "d"]
assert not any(d["done"] for d in r)
开发者ID:JunjieHu,项目名称:dl,代码行数:35,代码来源:test_fields.py
示例5: test_colonspace
def test_colonspace():
s = fields.Schema(content=fields.TEXT, url=fields.ID)
qp = default.QueryParser("content", s)
q = qp.parse(u("url:test"))
assert_equal(q.__class__, query.Term)
assert_equal(q.fieldname, "url")
assert_equal(q.text, "test")
q = qp.parse(u("url: test"))
assert_equal(q.__class__, query.And)
assert_equal(q[0].__class__, query.Term)
assert_equal(q[1].__class__, query.Term)
assert_equal(q[0].fieldname, "content")
assert_equal(q[1].fieldname, "content")
assert_equal(q[0].text, "url")
assert_equal(q[1].text, "test")
q = qp.parse(u("url:"))
assert_equal(q.__class__, query.Term)
assert_equal(q.fieldname, "content")
assert_equal(q.text, "url")
s = fields.Schema(foo=fields.KEYWORD)
qp = default.QueryParser("foo", s)
q = qp.parse(u("blah:"))
assert_equal(q.__class__, query.Term)
assert_equal(q.fieldname, "foo")
assert_equal(q.text, "blah:")
开发者ID:ChimmyTee,项目名称:oh-mainline,代码行数:28,代码来源:test_parsing.py
示例6: test_suggest_prefix
def test_suggest_prefix():
domain = ("Shoot To Kill",
"Bloom, Split and Deviate",
"Rankle the Seas and the Skies",
"Lightning Flash Flame Shell",
"Flower Wind Rage and Flower God Roar, Heavenly Wind Rage and "
"Heavenly Demon Sneer",
"All Waves, Rise now and Become my Shield, Lightning, Strike "
"now and Become my Blade",
"Cry, Raise Your Head, Rain Without end",
"Sting All Enemies To Death",
"Reduce All Creation to Ash",
"Sit Upon the Frozen Heavens",
"Call forth the Twilight")
schema = fields.Schema(content=fields.TEXT(stored=True, spelling=True),
quick=fields.NGRAM(maxsize=10, stored=True))
with TempIndex(schema, "sugprefix") as ix:
with ix.writer() as w:
for item in domain:
content = u(item)
w.add_document(content=content, quick=content)
with ix.searcher() as s:
sugs = s.suggest("content", u("ra"), maxdist=2, prefix=2)
assert sugs == ['rage', 'rain']
sugs = s.suggest("content", "ra", maxdist=2, prefix=1)
assert sugs == ["rage", "rain", "roar"]
开发者ID:JunjieHu,项目名称:dl,代码行数:30,代码来源:test_spelling.py
示例7: test_requires
def test_requires():
a = Term("f", u("a"))
b = Term("f", u("b"))
assert_equal(And([a, b]).requires(), set([a, b]))
assert_equal(Or([a, b]).requires(), set())
assert_equal(AndMaybe(a, b).requires(), set([a]))
assert_equal(a.requires(), set([a]))
开发者ID:ChimmyTee,项目名称:oh-mainline,代码行数:7,代码来源:test_queries.py
示例8: test_sorting_function
def test_sorting_function():
schema = fields.Schema(id=fields.STORED, text=fields.TEXT(stored=True, vector=True))
ix = RamStorage().create_index(schema)
w = ix.writer()
domain = ("alfa", "bravo", "charlie")
count = 1
for w1 in domain:
for w2 in domain:
for w3 in domain:
for w4 in domain:
w.add_document(id=count, text=u(" ").join((w1, w2, w3, w4)))
count += 1
w.commit()
def fn(searcher, docnum):
v = dict(searcher.vector_as("frequency", docnum, "text"))
# Sort documents that have equal number of "alfa"
# and "bravo" first
return 0 - 1.0 / (abs(v.get("alfa", 0) - v.get("bravo", 0)) + 1.0)
fnfacet = sorting.FunctionFacet(fn)
with ix.searcher() as s:
q = query.And([query.Term("text", u("alfa")), query.Term("text", u("bravo"))])
results = s.search(q, sortedby=fnfacet)
r = [hit["text"] for hit in results]
for t in r[:10]:
tks = t.split()
assert tks.count("alfa") == tks.count("bravo")
开发者ID:JunjieHu,项目名称:dl,代码行数:29,代码来源:test_sorting.py
示例9: test_compound_sort
def test_compound_sort():
fspec = fields.KEYWORD(stored=True, sortable=True)
schema = fields.Schema(a=fspec, b=fspec, c=fspec)
ix = RamStorage().create_index(schema)
alist = u("alfa bravo alfa bravo alfa bravo alfa bravo alfa bravo").split()
blist = u("alfa bravo charlie alfa bravo charlie alfa bravo charlie alfa").split()
clist = u("alfa bravo charlie delta echo foxtrot golf hotel india juliet").split()
assert all(len(ls) == 10 for ls in (alist, blist, clist))
with ix.writer() as w:
for i in xrange(10):
w.add_document(a=alist[i], b=blist[i], c=clist[i])
with ix.searcher() as s:
q = query.Every()
sortedby = [sorting.FieldFacet("a"), sorting.FieldFacet("b", reverse=True), sorting.FieldFacet("c")]
r = s.search(q, sortedby=sortedby)
output = []
for hit in r:
output.append(" ".join((hit["a"], hit["b"], hit["c"])))
assert output == [
"alfa charlie charlie",
"alfa charlie india",
"alfa bravo echo",
"alfa alfa alfa",
"alfa alfa golf",
"bravo charlie foxtrot",
"bravo bravo bravo",
"bravo bravo hotel",
"bravo alfa delta",
"bravo alfa juliet",
]
开发者ID:JunjieHu,项目名称:dl,代码行数:35,代码来源:test_sorting.py
示例10: test_overlapping_lists
def test_overlapping_lists():
schema = fields.Schema(id=fields.STORED, tags=fields.KEYWORD)
ix = RamStorage().create_index(schema)
with ix.writer() as w:
w.add_document(id=0, tags=u("alfa bravo charlie"))
w.add_document(id=1, tags=u("bravo charlie delta"))
w.add_document(id=2, tags=u("charlie delta echo"))
w.add_document(id=3, tags=u("delta echo alfa"))
w.add_document(id=4, tags=u("echo alfa bravo"))
with ix.searcher() as s:
of = sorting.FieldFacet("tags", allow_overlap=True)
cat = of.categorizer(s)
assert not cat._use_vectors
r = s.search(query.Every(), groupedby={"tags": of})
assert r.groups("tags") == {
"alfa": [0, 3, 4],
"bravo": [0, 1, 4],
"charlie": [0, 1, 2],
"delta": [1, 2, 3],
"echo": [2, 3, 4],
}
fcts = sorting.Facets()
fcts.add_field("tags", allow_overlap=True)
r = s.search(query.Every(), groupedby=fcts)
assert r.groups("tags") == {
"alfa": [0, 3, 4],
"bravo": [0, 1, 4],
"charlie": [0, 1, 2],
"delta": [1, 2, 3],
"echo": [2, 3, 4],
}
开发者ID:JunjieHu,项目名称:dl,代码行数:34,代码来源:test_sorting.py
示例11: check
def check(method):
with TempIndex(get_schema()) as ix:
method(ix)
with ix.searcher() as s:
results = s.search(query.Every(), groupedby="tag")
groups = results.groups()
assert sorted(groups.items()) == [(u("one"), [0, 6]), (u("three"), [1, 3, 7, 8]), (u("two"), [2, 4, 5])]
开发者ID:JunjieHu,项目名称:dl,代码行数:7,代码来源:test_sorting.py
示例12: __unicode__
def __unicode__(self):
r = self.text + u("~")
if self.maxdist > 1:
r += u("%d") % self.maxdist
if self.boost != 1.0:
r += u("^%f") % self.boost
return r
开发者ID:intabeta,项目名称:inta,代码行数:7,代码来源:terms.py
示例13: test_requires
def test_requires():
a = Term("f", u("a"))
b = Term("f", u("b"))
assert And([a, b]).requires() == set([a, b])
assert Or([a, b]).requires() == set()
assert AndMaybe(a, b).requires() == set([a])
assert a.requires() == set([a])
开发者ID:pombredanne,项目名称:whoosh-clone,代码行数:7,代码来源:test_queries.py
示例14: test_keyterms
def test_keyterms():
ix = create_index()
with ix.searcher() as s:
docnum = s.document_number(path="/a")
keys = list(s.key_terms([docnum], "content", numterms=3))
assert ([t[0] for t in keys]
== [u("collision"), u("calculations"), u("damped")])
开发者ID:JunjieHu,项目名称:dl,代码行数:7,代码来源:test_classify.py
示例15: test_boost_phrase
def test_boost_phrase():
schema = fields.Schema(title=fields.TEXT(field_boost=5.0, stored=True), text=fields.TEXT)
ix = RamStorage().create_index(schema)
domain = u("alfa bravo charlie delta").split()
w = ix.writer()
for ls in permutations(domain):
t = u(" ").join(ls)
w.add_document(title=t, text=t)
w.commit()
q = Or([Term("title", u("alfa")), Term("title", u("bravo")), Phrase("text", [u("bravo"), u("charlie"), u("delta")])])
def boost_phrases(q):
if isinstance(q, Phrase):
q.boost *= 1000.0
return q
else:
return q.apply(boost_phrases)
q = boost_phrases(q)
with ix.searcher() as s:
r = s.search(q, limit=None)
for hit in r:
if "bravo charlie delta" in hit["title"]:
assert hit.score > 100.0
开发者ID:ChimmyTee,项目名称:oh-mainline,代码行数:25,代码来源:test_searching.py
示例16: test_hit_column
def test_hit_column():
# Not stored
schema = fields.Schema(text=fields.TEXT())
ix = RamStorage().create_index(schema)
with ix.writer() as w:
w.add_document(text=u("alfa bravo charlie"))
with ix.searcher() as s:
r = s.search(query.Term("text", "alfa"))
assert len(r) == 1
hit = r[0]
with pytest.raises(KeyError):
_ = hit["text"]
# With column
schema = fields.Schema(text=fields.TEXT(sortable=True))
ix = RamStorage().create_index(schema)
with ix.writer(codec=W3Codec()) as w:
w.add_document(text=u("alfa bravo charlie"))
with ix.searcher() as s:
r = s.search(query.Term("text", "alfa"))
assert len(r) == 1
hit = r[0]
assert hit["text"] == u("alfa bravo charlie")
开发者ID:pombredanne,项目名称:whoosh-clone,代码行数:25,代码来源:test_results.py
示例17: test_substitution
def test_substitution():
mf = analysis.RegexTokenizer(r"\S+") | analysis.SubstitutionFilter("-", "")
assert_equal([t.text for t in mf(u("one-two th-re-ee four"))],
["onetwo", "threee", "four"])
mf = analysis.RegexTokenizer(r"\S+") | analysis.SubstitutionFilter("([^=]*)=(.*)", r"\2=\1")
assert_equal([t.text for t in mf(u("a=b c=d ef"))], ["b=a", "d=c", "ef"])
开发者ID:ChimmyTee,项目名称:oh-mainline,代码行数:7,代码来源:test_analysis.py
示例18: test_term_inspection
def test_term_inspection():
schema = fields.Schema(title=fields.TEXT(stored=True),
content=fields.TEXT)
st = RamStorage()
ix = st.create_index(schema)
writer = ix.writer()
writer.add_document(title=u("My document"),
content=u("AA AA BB BB CC AA AA AA BB BB CC DD EE EE"))
writer.add_document(title=u("My other document"),
content=u("AA AB BB CC EE EE AX AX DD"))
writer.commit()
reader = ix.reader()
assert " ".join(reader.field_terms("content")) == "aa ab ax bb cc dd ee"
assert list(reader.expand_prefix("content", "a")) == [b('aa'), b('ab'), b('ax')]
assert set(reader.all_terms()) == set([('content', b('aa')), ('content', b('ab')),
('content', b('ax')), ('content', b('bb')),
('content', b('cc')), ('content', b('dd')),
('content', b('ee')), ('title', b('document')),
('title', b('my')), ('title', b('other'))])
# (text, doc_freq, index_freq)
assert _fstats(reader.iter_field("content")) == [(b('aa'), 2, 6), (b('ab'), 1, 1), (b('ax'), 1, 2),
(b('bb'), 2, 5), (b('cc'), 2, 3), (b('dd'), 2, 2),
(b('ee'), 2, 4)]
assert _fstats(reader.iter_field("content", prefix="c")) == [(b('cc'), 2, 3), (b('dd'), 2, 2), (b('ee'), 2, 4)]
assert list(reader.most_frequent_terms("content")) == [(6, b('aa')), (5, b('bb')), (4, b('ee')), (3, b('cc')), (2, b('dd'))]
assert list(reader.most_frequent_terms("content", prefix="a")) == [(6, b('aa')), (2, b('ax')), (1, b('ab'))]
assert list(reader.most_distinctive_terms("content", 3)) == [(1.3862943611198906, b('ax')), (0.6931471805599453, b('ab')), (0.0, b('ee'))]
开发者ID:JunjieHu,项目名称:dl,代码行数:28,代码来源:test_reading.py
示例19: __unicode__
def __unicode__(self):
r = u("%s:%s") % (self.fieldname, self.text) + u("~")
if self.maxdist > 1:
r += u("%d") % self.maxdist
if self.boost != 1.0:
r += u("^%f") % self.boost
return r
开发者ID:32footsteps,项目名称:SpecialCollectionsProject,代码行数:7,代码来源:terms.py
示例20: test_gtlt
def test_gtlt():
schema = fields.Schema(a=fields.KEYWORD, b=fields.NUMERIC,
c=fields.KEYWORD,
d=fields.NUMERIC(float), e=fields.DATETIME)
qp = qparser.QueryParser("a", schema)
qp.add_plugin(plugins.GtLtPlugin())
qp.add_plugin(dateparse.DateParserPlugin())
q = qp.parse(u("a:hello b:>100 c:<=z there"))
assert_equal(q.__class__, query.And)
assert_equal(len(q), 4)
assert_equal(q[0], query.Term("a", "hello"))
assert_equal(q[1], query.NumericRange("b", 100, None, startexcl=True))
assert_equal(q[2], query.TermRange("c", None, 'z'))
assert_equal(q[3], query.Term("a", "there"))
q = qp.parse(u("hello e:>'29 mar 2001' there"))
assert_equal(q.__class__, query.And)
assert_equal(len(q), 3)
assert_equal(q[0], query.Term("a", "hello"))
# As of this writing, date ranges don't support startexcl/endexcl
assert_equal(q[1], query.DateRange("e", datetime(2001, 3, 29, 0, 0), None))
assert_equal(q[2], query.Term("a", "there"))
q = qp.parse(u("a:> alfa c:<= bravo"))
assert_equal(text_type(q), "(a:a: AND a:alfa AND a:c: AND a:bravo)")
qp.remove_plugin_class(plugins.FieldsPlugin)
qp.remove_plugin_class(plugins.RangePlugin)
q = qp.parse(u("hello a:>500 there"))
assert_equal(text_type(q), "(a:hello AND a:a: AND a:500 AND a:there)")
开发者ID:ChimmyTee,项目名称:oh-mainline,代码行数:31,代码来源:test_parse_plugins.py
注:本文中的whoosh.compat.u函数示例由纯净天空整理自Github/MSDocs等源码及文档管理平台,相关代码片段筛选自各路编程大神贡献的开源项目,源码版权归原作者所有,传播和使用请参考对应项目的License;未经允许,请勿转载。 |
请发表评论