123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159160161162163164165166167168169170171172173174175176177178179180181182183184185186187188189190191192193194195196197198199200201202203204205206207208209210211212213214215216217218219220221222223224225226227228229230231232233234235236237238239240241242243244245246247248249250251252253254255256257258259260261262263264265266267268269270271272273274275276277278279280281282283284285286287288289290291292 |
- import datetime
- import logging
- import random
- import string
- import time
- import click
- from flask import current_app
- from werkzeug.exceptions import NotFound
- from core.index.index import IndexBuilder
- from libs.password import password_pattern, valid_password, hash_password
- from libs.helper import email as email_validate
- from extensions.ext_database import db
- from libs.rsa import generate_key_pair
- from models.account import InvitationCode, Tenant
- from models.dataset import Dataset, DatasetQuery, Document, DocumentSegment
- from models.model import Account
- import secrets
- import base64
- from models.provider import Provider, ProviderName
- from services.provider_service import ProviderService
- @click.command('reset-password', help='Reset the account password.')
- @click.option('--email', prompt=True, help='The email address of the account whose password you need to reset')
- @click.option('--new-password', prompt=True, help='the new password.')
- @click.option('--password-confirm', prompt=True, help='the new password confirm.')
- def reset_password(email, new_password, password_confirm):
- if str(new_password).strip() != str(password_confirm).strip():
- click.echo(click.style('sorry. The two passwords do not match.', fg='red'))
- return
- account = db.session.query(Account). \
- filter(Account.email == email). \
- one_or_none()
- if not account:
- click.echo(click.style('sorry. the account: [{}] not exist .'.format(email), fg='red'))
- return
- try:
- valid_password(new_password)
- except:
- click.echo(
- click.style('sorry. The passwords must match {} '.format(password_pattern), fg='red'))
- return
- # generate password salt
- salt = secrets.token_bytes(16)
- base64_salt = base64.b64encode(salt).decode()
- # encrypt password with salt
- password_hashed = hash_password(new_password, salt)
- base64_password_hashed = base64.b64encode(password_hashed).decode()
- account.password = base64_password_hashed
- account.password_salt = base64_salt
- db.session.commit()
- click.echo(click.style('Congratulations!, password has been reset.', fg='green'))
- @click.command('reset-email', help='Reset the account email.')
- @click.option('--email', prompt=True, help='The old email address of the account whose email you need to reset')
- @click.option('--new-email', prompt=True, help='the new email.')
- @click.option('--email-confirm', prompt=True, help='the new email confirm.')
- def reset_email(email, new_email, email_confirm):
- if str(new_email).strip() != str(email_confirm).strip():
- click.echo(click.style('Sorry, new email and confirm email do not match.', fg='red'))
- return
- account = db.session.query(Account). \
- filter(Account.email == email). \
- one_or_none()
- if not account:
- click.echo(click.style('sorry. the account: [{}] not exist .'.format(email), fg='red'))
- return
- try:
- email_validate(new_email)
- except:
- click.echo(
- click.style('sorry. {} is not a valid email. '.format(email), fg='red'))
- return
- account.email = new_email
- db.session.commit()
- click.echo(click.style('Congratulations!, email has been reset.', fg='green'))
- @click.command('reset-encrypt-key-pair', help='Reset the asymmetric key pair of workspace for encrypt LLM credentials. '
- 'After the reset, all LLM credentials will become invalid, '
- 'requiring re-entry.'
- 'Only support SELF_HOSTED mode.')
- @click.confirmation_option(prompt=click.style('Are you sure you want to reset encrypt key pair?'
- ' this operation cannot be rolled back!', fg='red'))
- def reset_encrypt_key_pair():
- if current_app.config['EDITION'] != 'SELF_HOSTED':
- click.echo(click.style('Sorry, only support SELF_HOSTED mode.', fg='red'))
- return
- tenant = db.session.query(Tenant).first()
- if not tenant:
- click.echo(click.style('Sorry, no workspace found. Please enter /install to initialize.', fg='red'))
- return
- tenant.encrypt_public_key = generate_key_pair(tenant.id)
- db.session.query(Provider).filter(Provider.provider_type == 'custom').delete()
- db.session.commit()
- click.echo(click.style('Congratulations! '
- 'the asymmetric key pair of workspace {} has been reset.'.format(tenant.id), fg='green'))
- @click.command('generate-invitation-codes', help='Generate invitation codes.')
- @click.option('--batch', help='The batch of invitation codes.')
- @click.option('--count', prompt=True, help='Invitation codes count.')
- def generate_invitation_codes(batch, count):
- if not batch:
- now = datetime.datetime.now()
- batch = now.strftime('%Y%m%d%H%M%S')
- if not count or int(count) <= 0:
- click.echo(click.style('sorry. the count must be greater than 0.', fg='red'))
- return
- count = int(count)
- click.echo('Start generate {} invitation codes for batch {}.'.format(count, batch))
- codes = ''
- for i in range(count):
- code = generate_invitation_code()
- invitation_code = InvitationCode(
- code=code,
- batch=batch
- )
- db.session.add(invitation_code)
- click.echo(code)
- codes += code + "\n"
- db.session.commit()
- filename = 'storage/invitation-codes-{}.txt'.format(batch)
- with open(filename, 'w') as f:
- f.write(codes)
- click.echo(click.style(
- 'Congratulations! Generated {} invitation codes for batch {} and saved to the file \'{}\''.format(count, batch,
- filename),
- fg='green'))
- def generate_invitation_code():
- code = generate_upper_string()
- while db.session.query(InvitationCode).filter(InvitationCode.code == code).count() > 0:
- code = generate_upper_string()
- return code
- def generate_upper_string():
- letters_digits = string.ascii_uppercase + string.digits
- result = ""
- for i in range(8):
- result += random.choice(letters_digits)
- return result
- @click.command('recreate-all-dataset-indexes', help='Recreate all dataset indexes.')
- def recreate_all_dataset_indexes():
- click.echo(click.style('Start recreate all dataset indexes.', fg='green'))
- recreate_count = 0
- page = 1
- while True:
- try:
- datasets = db.session.query(Dataset).filter(Dataset.indexing_technique == 'high_quality') \
- .order_by(Dataset.created_at.desc()).paginate(page=page, per_page=50)
- except NotFound:
- break
- page += 1
- for dataset in datasets:
- try:
- click.echo('Recreating dataset index: {}'.format(dataset.id))
- index = IndexBuilder.get_index(dataset, 'high_quality')
- if index and index._is_origin():
- index.recreate_dataset(dataset)
- recreate_count += 1
- else:
- click.echo('passed.')
- except Exception as e:
- click.echo(
- click.style('Recreate dataset index error: {} {}'.format(e.__class__.__name__, str(e)), fg='red'))
- continue
- click.echo(click.style('Congratulations! Recreate {} dataset indexes.'.format(recreate_count), fg='green'))
- @click.command('clean-unused-dataset-indexes', help='Clean unused dataset indexes.')
- def clean_unused_dataset_indexes():
- click.echo(click.style('Start clean unused dataset indexes.', fg='green'))
- clean_days = int(current_app.config.get('CLEAN_DAY_SETTING'))
- start_at = time.perf_counter()
- thirty_days_ago = datetime.datetime.now() - datetime.timedelta(days=clean_days)
- page = 1
- while True:
- try:
- datasets = db.session.query(Dataset).filter(Dataset.created_at < thirty_days_ago) \
- .order_by(Dataset.created_at.desc()).paginate(page=page, per_page=50)
- except NotFound:
- break
- page += 1
- for dataset in datasets:
- dataset_query = db.session.query(DatasetQuery).filter(
- DatasetQuery.created_at > thirty_days_ago,
- DatasetQuery.dataset_id == dataset.id
- ).all()
- if not dataset_query or len(dataset_query) == 0:
- documents = db.session.query(Document).filter(
- Document.dataset_id == dataset.id,
- Document.indexing_status == 'completed',
- Document.enabled == True,
- Document.archived == False,
- Document.updated_at > thirty_days_ago
- ).all()
- if not documents or len(documents) == 0:
- try:
- # remove index
- vector_index = IndexBuilder.get_index(dataset, 'high_quality')
- kw_index = IndexBuilder.get_index(dataset, 'economy')
- # delete from vector index
- if vector_index:
- vector_index.delete()
- kw_index.delete()
- # update document
- update_params = {
- Document.enabled: False
- }
- Document.query.filter_by(dataset_id=dataset.id).update(update_params)
- db.session.commit()
- click.echo(click.style('Cleaned unused dataset {} from db success!'.format(dataset.id),
- fg='green'))
- except Exception as e:
- click.echo(
- click.style('clean dataset index error: {} {}'.format(e.__class__.__name__, str(e)),
- fg='red'))
- end_at = time.perf_counter()
- click.echo(click.style('Cleaned unused dataset from db success latency: {}'.format(end_at - start_at), fg='green'))
- @click.command('sync-anthropic-hosted-providers', help='Sync anthropic hosted providers.')
- def sync_anthropic_hosted_providers():
- click.echo(click.style('Start sync anthropic hosted providers.', fg='green'))
- count = 0
- page = 1
- while True:
- try:
- tenants = db.session.query(Tenant).order_by(Tenant.created_at.desc()).paginate(page=page, per_page=50)
- except NotFound:
- break
- page += 1
- for tenant in tenants:
- try:
- click.echo('Syncing tenant anthropic hosted provider: {}'.format(tenant.id))
- ProviderService.create_system_provider(
- tenant,
- ProviderName.ANTHROPIC.value,
- current_app.config['ANTHROPIC_HOSTED_QUOTA_LIMIT'],
- True
- )
- count += 1
- except Exception as e:
- click.echo(click.style(
- 'Sync tenant anthropic hosted provider error: {} {}'.format(e.__class__.__name__, str(e)),
- fg='red'))
- continue
- click.echo(click.style('Congratulations! Synced {} anthropic hosted providers.'.format(count), fg='green'))
- def register_commands(app):
- app.cli.add_command(reset_password)
- app.cli.add_command(reset_email)
- app.cli.add_command(generate_invitation_codes)
- app.cli.add_command(reset_encrypt_key_pair)
- app.cli.add_command(recreate_all_dataset_indexes)
- app.cli.add_command(sync_anthropic_hosted_providers)
- app.cli.add_command(clean_unused_dataset_indexes)
|