Skip to content
Projects
Groups
Snippets
Help
Loading...
Help
Submit feedback
Contribute to GitLab
Sign in
Toggle navigation
D
dify
Project
Project
Details
Activity
Releases
Cycle Analytics
Repository
Repository
Files
Commits
Branches
Tags
Contributors
Graph
Compare
Charts
Issues
0
Issues
0
List
Board
Labels
Milestones
Merge Requests
0
Merge Requests
0
CI / CD
CI / CD
Pipelines
Jobs
Schedules
Charts
Wiki
Wiki
Snippets
Snippets
Members
Members
Collapse sidebar
Close sidebar
Activity
Graph
Charts
Create a new issue
Jobs
Commits
Issue Boards
Open sidebar
ai-tech
dify
Commits
e148aad0
Commit
e148aad0
authored
Jul 19, 2023
by
jyong
Browse files
Options
Browse Files
Download
Plain Diff
Merge branch 'feat/clean-vector-dataset' into deploy/dev
parents
77f7131e
43aaac36
Changes
1
Hide whitespace changes
Inline
Side-by-side
Showing
1 changed file
with
19 additions
and
23 deletions
+19
-23
commands.py
api/commands.py
+19
-23
No files found.
api/commands.py
View file @
e148aad0
...
@@ -221,31 +221,27 @@ def clean_unused_dataset_indexes():
...
@@ -221,31 +221,27 @@ def clean_unused_dataset_indexes():
Document
.
indexing_status
==
'completed'
,
Document
.
indexing_status
==
'completed'
,
Document
.
enabled
==
True
,
Document
.
enabled
==
True
,
Document
.
archived
==
False
,
Document
.
archived
==
False
,
Document
.
updated_at
<
thirty_days_ago
Document
.
updated_at
>
thirty_days_ago
)
.
all
()
)
.
all
()
if
documents
:
if
not
documents
and
len
(
documents
)
>
0
:
for
document
in
documents
:
try
:
click
.
style
(
'Start clean document segments from index: {}'
.
format
(
document
.
id
),
update_params
=
{
fg
=
'green'
)
Document
.
enabled
:
False
document
.
enabled
=
False
}
Document
.
query
.
filter_by
(
dataset_id
=
dataset
.
id
)
.
update
(
update_params
)
db
.
session
.
commit
()
db
.
session
.
commit
()
try
:
# remove index
# remove index
vector_index
=
IndexBuilder
.
get_index
(
dataset
,
'high_quality'
)
vector_index
=
IndexBuilder
.
get_index
(
dataset
,
'high_quality'
)
kw_index
=
IndexBuilder
.
get_index
(
dataset
,
'economy'
)
kw_index
=
IndexBuilder
.
get_index
(
dataset
,
'economy'
)
# delete from vector index
if
vector_index
:
# delete from vector index
vector_index
.
delete
()
if
vector_index
:
kw_index
.
delete
()
vector_index
.
delete_by_document_id
(
document
.
id
)
except
Exception
as
e
:
click
.
echo
(
# delete from keyword index
click
.
style
(
'clean dataset index error: {} {}'
.
format
(
e
.
__class__
.
__name__
,
str
(
e
)),
segments
=
db
.
session
.
query
(
DocumentSegment
)
.
filter
(
fg
=
'red'
))
DocumentSegment
.
document_id
==
document
.
id
)
.
all
()
index_node_ids
=
[
segment
.
index_node_id
for
segment
in
segments
]
if
index_node_ids
:
kw_index
.
delete_by_ids
(
index_node_ids
)
except
Exception
:
logging
.
exception
(
"clean document from index failed: {}"
.
format
(
document
.
id
))
end_at
=
time
.
perf_counter
()
end_at
=
time
.
perf_counter
()
click
.
echo
(
click
.
style
(
'Cleaned unused dataset from db success latency: {}'
.
format
(
end_at
-
start_at
),
fg
=
'green'
))
click
.
echo
(
click
.
style
(
'Cleaned unused dataset from db success latency: {}'
.
format
(
end_at
-
start_at
),
fg
=
'green'
))
...
...
Write
Preview
Markdown
is supported
0%
Try again
or
attach a new file
Attach a file
Cancel
You are about to add
0
people
to the discussion. Proceed with caution.
Finish editing this message first!
Cancel
Please
register
or
sign in
to comment