ind*_*nds 5 python django elasticsearch elasticsearch-dsl
我在 Django 项目中使用 elasticsearch-dsl 库来索引数据,然后查询回来。
我有以下模型(models):
class Comments(models.Model):
    """Comment row linked to a ``UserPosts`` entry and indexable in Elasticsearch.

    Every scalar column is declared as a nullable string/text field.
    """

    comment_id = models.CharField(max_length=1000, blank=True, null=True)
    user_post_id = models.ForeignKey('UserPosts', null=True)
    score = models.CharField(max_length=1000, blank=True, null=True)
    text = models.TextField(blank=True, null=True)
    creation_date = models.CharField(max_length=1000, blank=True, null=True)

    def __unicode__(self):
        # comment_id is nullable; __unicode__ must return text, never None.
        return self.comment_id or u''

    def indexing(self):
        """Save this comment into ``comments-index`` and return it as a dict.

        Returns:
            The result of ``to_dict(include_meta=True)`` on the saved
            document, which ``bulk_indexing`` feeds to the bulk helper.
        """
        # Accessing the ForeignKey attribute yields the related model instance
        # (or None), which the nested field cannot serialize. Hand it a plain
        # mapping with the two fields the nested document declares instead.
        post = self.user_post_id
        nested_post = None
        if post is not None:
            nested_post = {
                'user_post_id': post.user_post_id,
                'score': post.score,
            }

        obj = CommentsIndex(
            meta={'id': self.id},
            comment_id=self.comment_id,
            user_post_id=nested_post,
            score=self.score,
            text=self.text,
            creation_date=self.creation_date,
        )
        obj.save(index='comments-index')
        return obj.to_dict(include_meta=True)
class UserPosts(models.Model):
    """Post row; every scalar column is declared as a nullable string/text field."""

    user_post_id = models.CharField(max_length=1000, blank=True, null=True)
    user_post_type_id = models.CharField(max_length=1000, blank=True, null=True)
    accepted_answer_id = models.CharField(max_length=1000, blank=True, null=True)
    creation_date = models.CharField(max_length=1000, blank=True, null=True)
    score = models.CharField(max_length=1000, blank=True, null=True)
    view_count = models.CharField(max_length=1000, blank=True, null=True)
    body = models.TextField(blank=True, null=True)
    last_editor_user_id = models.CharField(max_length=1000, blank=True, null=True)
    last_editor_display_name = models.CharField(max_length=1000, blank=True, null=True)
    last_edit_date = models.CharField(max_length=1000, blank=True, null=True)
    last_activity_date = models.CharField(max_length=1000, blank=True, null=True)
    title = models.CharField(max_length=1000, blank=True, null=True)
    tags = models.CharField(max_length=1000, blank=True, null=True)
    answer_count = models.CharField(max_length=1000, blank=True, null=True)
    comment_count = models.CharField(max_length=1000, blank=True, null=True)
    favorite_count = models.CharField(max_length=1000, blank=True, null=True)
    owner_user_id = models.ForeignKey(StackOverFlowUsers, null=True)
    parent_id = models.CharField(max_length=1000, blank=True, null=True)

    def __unicode__(self):
        # user_post_id is nullable; __unicode__ must return text, never None.
        return self.user_post_id or u''
Run Code Online (Sandbox Code Playgroud)
这就是我将模型包装在文档类型中的方式:
class UserPostsIndex(InnerDoc):
    """Inner document holding the post fields embedded in a comment document."""

    user_post_id = Text()
    score = Text()
class CommentsIndex(DocType):
    """Document type for comments; ``user_post_id`` is a nested ``UserPostsIndex``."""

    comment_id = Text()
    user_post_id = Nested(UserPostsIndex)
    score = Text()
    text = Text()
    creation_date = Text()
Run Code Online (Sandbox Code Playgroud)
当我调用以下函数时,我的数据会被索引到 Elasticsearch 中:
def bulk_indexing():
    """Initialise ``comments-index`` and push every ``Comments`` row through ``bulk``."""
    CommentsIndex.init(index='comments-index')
    client = Elasticsearch()
    comments = models.Comments.objects.all().iterator()
    # Lazily yield one action dict per comment via its indexing() method.
    actions = (comment.indexing() for comment in comments)
    bulk(client=client, actions=actions)
Run Code Online (Sandbox Code Playgroud)
我尝试测试是否可以查询数据的方法是使用搜索功能,如下所示:
def search(text):
    """Execute a ``term`` filter on ``score`` against ``comments-index``.

    Returns the response object produced by ``Search.execute()``.
    """
    query = Search(index="comments-index").filter("term", score=text)
    return query.execute()
Run Code Online (Sandbox Code Playgroud)
我无法查询嵌套对象,并尝试了很多不同的方法但失败了。如何获取嵌套对象字段,例如 user_post_id.score?
类似下面这样的嵌套查询应该可行:
# Nested query on the user_post_id path. The keyword user_post_id__score
# addresses the nested field user_post_id.score ("__" stands for the dot).
CommentsIndex.search().query('nested', path='user_post_id', query=Q('range', user_post_id__score={'gt': 42}))
Run Code Online (Sandbox Code Playgroud)
| 归档时间: |
|
| 查看次数: |
9106 次 |
| 最近记录: |