hugegraph-llm/src/hugegraph_llm/config/config.py - incubator-hugegraph-ai - Git at Google

 # Licensed to the Apache Software Foundation (ASF) under one
 # or more contributor license agreements.  See the NOTICE file
 # distributed with this work for additional information
 # regarding copyright ownership.  The ASF licenses this file
 # to you under the Apache License, Version 2.0 (the
 # "License"); you may not use this file except in compliance
 # with the License.  You may obtain a copy of the License at
 #
 #   http://www.apache.org/licenses/LICENSE-2.0
 #
 # Unless required by applicable law or agreed to in writing,
 # software distributed under the License is distributed on an
 # "AS IS" BASIS, WITHOUT WARRANTIES OR CONDITIONS OF ANY
 # KIND, either express or implied.  See the License for the
 # specific language governing permissions and limitations
 # under the License.


 import os
 from dataclasses import dataclass
 from typing import Optional

 import yaml
 from dotenv import dotenv_values, set_key

 from hugegraph_llm.config.config_data import ConfigData, PromptData
 from hugegraph_llm.utils.log import log

 # Shorthand so the nested dirname() chain below stays readable.
 dir_name = os.path.dirname
 # Directory four levels above this file's absolute path.
 package_path = dir_name(dir_name(dir_name(dir_name(os.path.abspath(__file__)))))
 # Location of the .env file, directly inside package_path.
 env_path = os.path.join(package_path, ".env")
 # File name of the prompt configuration YAML.
 F_NAME = "config_prompt.yaml"
 # Full path of the prompt YAML, under src/hugegraph_llm/resources/demo/ inside package_path.
 yaml_file_path = os.path.join(package_path, f"src/hugegraph_llm/resources/demo/{F_NAME}")


 def read_dotenv() -> dict[str, Optional[str]]:
     """Parse the ``.env`` file at ``env_path`` and export its entries.

     Each key that is not yet present in ``os.environ`` is added to it; a
     missing or empty value is exported as an empty string.  Variables that
     already exist in the process environment are left untouched.

     Returns:
         The mapping produced by ``dotenv_values`` for the file.
     """
     parsed = dotenv_values(f"{env_path}")
     log.info("Loading %s successfully!", env_path)
     for name, raw in parsed.items():
         # setdefault writes only when the variable is absent, so values
         # already set in the real environment take precedence over the file.
         os.environ.setdefault(name, raw or "")
     return parsed


 @dataclass
 class Config(ConfigData):
     """Configuration object kept in sync with the ``.env`` file at ``env_path``.

     The class declares no fields of its own; every setting is inherited from
     ``ConfigData``.  The methods below load values from ``.env``, create the
     file from the current values, and append or refresh individual keys.
     """

     @staticmethod
     def _to_env_value(value) -> str:
         """Return the text stored in ``.env`` for one field value.

         Only ``None`` is written as an empty value.  Other falsy values such
         as ``0`` keep their text form, so they are not erased from the file.
         """
         return "" if value is None else str(value)

     def _as_env_dict(self) -> dict[str, str]:
         """Map every instance attribute to its upper-cased key and text value."""
         return {name.upper(): self._to_env_value(value) for name, value in self.__dict__.items()}

     def from_env(self):
         """Load settings from ``.env``, or create the file when it is missing.

         Keys are lower-cased before being matched against the annotated
         fields.  Unknown keys and empty values are skipped, so the current
         attribute value is kept for them.  Fields annotated ``int`` or
         ``Optional[int]`` are converted to ``int``.

         Raises:
             ValueError: if the value of an integer field is not a valid integer.
         """
         if not os.path.exists(env_path):
             self.generate_env()
             return
         annotations = self.__annotations__
         for key, value in read_dotenv().items():
             field_name = key.lower()
             if field_name not in annotations or not value:
                 continue
             if annotations[field_name] in [int, Optional[int]]:
                 try:
                     value = int(value)
                 except ValueError as err:
                     # Name the offending key so a bad .env entry is easy to find.
                     raise ValueError(f"Invalid integer for {key} in {env_path}: {value!r}") from err
             setattr(self, field_name, value)

     def generate_env(self):
         """Write the current values to ``.env``.

         When the file already exists the user is asked on stdin whether to
         override it; only the answer ``y`` (any case) triggers ``update_env``.
         When it does not exist, one ``KEY=value`` line is written per attribute.
         """
         if os.path.exists(env_path):
             log.info("%s already exists, do you want to override with the default configuration? (y/n)", env_path)
             answer = input()
             if answer.strip().lower() != "y":
                 return
             self.update_env()
         else:
             with open(env_path, "w", encoding="utf-8") as f:
                 for k, v in self._as_env_dict().items():
                     f.write(f"{k}={v}\n")
             log.info("Generate %s successfully!", env_path)

     def check_env(self):
         """Append to ``.env`` every key that the file does not contain yet.

         Keys that are already present keep whatever value the file holds.
         """
         env_config = dotenv_values(f"{env_path}")
         for k, v in self._as_env_dict().items():
             if k in env_config:
                 continue
             log.info("Update %s: %s=%s", env_path, k, v)
             set_key(env_path, k, v, quote_mode="never")

     def update_env(self):
         """Write to ``.env`` every key that is missing or whose value differs."""
         env_config = dotenv_values(f"{env_path}")
         for k, v in self._as_env_dict().items():
             # .get() yields None for a missing key, which never equals a str,
             # so missing and changed keys are handled by the same test.
             if env_config.get(k) == v:
                 continue
             log.info("Update %s: %s=%s", env_path, k, v)
             set_key(env_path, k, v, quote_mode="never")


 class PromptConfig(PromptData):
     """Prompt texts persisted in the YAML file at ``yaml_file_path``."""

     # (YAML key == attribute name, indentation used for the block-scalar body)
     _YAML_FIELDS = (
         ("graph_schema", "  "),
         ("extract_graph_prompt", "    "),
         ("default_question", "    "),
         ("custom_rerank_info", "    "),
         ("answer_prompt", "    "),
         ("keywords_extract_prompt", "    "),
     )

     def ensure_yaml_file_exists(self):
         """Load the prompt YAML into this object, creating the file if absent.

         Every top-level key found in the file is set as an attribute of the
         same name.  An empty file yields no overrides.
         """
         if not os.path.exists(yaml_file_path):
             # generate_yaml_file() logs the creation message itself.
             self.generate_yaml_file()
             return
         with open(yaml_file_path, "r", encoding="utf-8") as file:
             # safe_load returns None for an empty document.
             data = yaml.safe_load(file) or {}
         for key, value in data.items():
             setattr(self, key, value)
         log.info("Loading prompt file '%s' successfully.", F_NAME)

     def save_to_yaml(self):
         """Write all prompt fields to the YAML file as literal block scalars.

         Each field becomes ``<key>: |`` followed by its text, every line
         prefixed with the field's indentation, and then one blank line.
         Extend ``_YAML_FIELDS`` to store additional fields.
         """
         sections = []
         for key, indent in self._YAML_FIELDS:
             body = "\n".join(f"{indent}{line}" for line in getattr(self, key).splitlines())
             sections.append(f"{key}: |\n{body}\n\n")
         with open(yaml_file_path, "w", encoding="utf-8") as file:
             file.write("".join(sections))

     def generate_yaml_file(self):
         """Create the prompt YAML from the current values.

         When the file already exists the user is asked on stdin whether to
         override it; only the answer ``y`` (any case) rewrites the file.
         """
         if os.path.exists(yaml_file_path):
             log.info("%s already exists, do you want to override with the default configuration? (y/n)", yaml_file_path)
             answer = input()
             if answer.strip().lower() != "y":
                 return
             self.save_to_yaml()
         else:
             self.save_to_yaml()
             log.info("Prompt file '%s' doesn't exist, create it.", yaml_file_path)

     def update_yaml_file(self):
         """Rewrite the prompt YAML unconditionally with the current values."""
         self.save_to_yaml()
         log.info("Prompt file '%s' updated successfully.", F_NAME)
	# Licensed to the Apache Software Foundation (ASF) under one
	# or more contributor license agreements. See the NOTICE file
	# distributed with this work for additional information
	# regarding copyright ownership. The ASF licenses this file
	# to you under the Apache License, Version 2.0 (the
	# "License"); you may not use this file except in compliance
	# with the License. You may obtain a copy of the License at
	#
	# http://www.apache.org/licenses/LICENSE-2.0
	#
	# Unless required by applicable law or agreed to in writing,
	# software distributed under the License is distributed on an
	# "AS IS" BASIS, WITHOUT WARRANTIES OR CONDITIONS OF ANY
	# KIND, either express or implied. See the License for the
	# specific language governing permissions and limitations
	# under the License.


	import os
	from dataclasses import dataclass
	from typing import Optional

	import yaml
	from dotenv import dotenv_values, set_key

	from hugegraph_llm.config.config_data import ConfigData, PromptData
	from hugegraph_llm.utils.log import log

	# Shorthand so the nested dirname() chain below stays readable.
	dir_name = os.path.dirname
	# Directory four levels above this file's absolute path.
	package_path = dir_name(dir_name(dir_name(dir_name(os.path.abspath(__file__)))))
	# Location of the .env file, directly inside package_path.
	env_path = os.path.join(package_path, ".env")
	# File name of the prompt configuration YAML.
	F_NAME = "config_prompt.yaml"
	# Full path of the prompt YAML, under src/hugegraph_llm/resources/demo/ inside package_path.
	yaml_file_path = os.path.join(package_path, f"src/hugegraph_llm/resources/demo/{F_NAME}")


	def read_dotenv() -> dict[str, Optional[str]]:
	    """Parse the ``.env`` file at ``env_path`` and export its entries.

	    Each key that is not yet present in ``os.environ`` is added to it; a
	    missing or empty value is exported as an empty string.  Variables that
	    already exist in the process environment are left untouched.

	    Returns:
	        The mapping produced by ``dotenv_values`` for the file.
	    """
	    parsed = dotenv_values(f"{env_path}")
	    log.info("Loading %s successfully!", env_path)
	    for name, raw in parsed.items():
	        # setdefault writes only when the variable is absent, so values
	        # already set in the real environment take precedence over the file.
	        os.environ.setdefault(name, raw or "")
	    return parsed


	@dataclass
	class Config(ConfigData):
	    """Configuration object kept in sync with the ``.env`` file at ``env_path``.

	    The class declares no fields of its own; every setting is inherited from
	    ``ConfigData``.  The methods below load values from ``.env``, create the
	    file from the current values, and append or refresh individual keys.
	    """

	    @staticmethod
	    def _to_env_value(value) -> str:
	        """Return the text stored in ``.env`` for one field value.

	        Only ``None`` is written as an empty value.  Other falsy values such
	        as ``0`` keep their text form, so they are not erased from the file.
	        """
	        return "" if value is None else str(value)

	    def _as_env_dict(self) -> dict[str, str]:
	        """Map every instance attribute to its upper-cased key and text value."""
	        return {name.upper(): self._to_env_value(value) for name, value in self.__dict__.items()}

	    def from_env(self):
	        """Load settings from ``.env``, or create the file when it is missing.

	        Keys are lower-cased before being matched against the annotated
	        fields.  Unknown keys and empty values are skipped, so the current
	        attribute value is kept for them.  Fields annotated ``int`` or
	        ``Optional[int]`` are converted to ``int``.

	        Raises:
	            ValueError: if the value of an integer field is not a valid integer.
	        """
	        if not os.path.exists(env_path):
	            self.generate_env()
	            return
	        annotations = self.__annotations__
	        for key, value in read_dotenv().items():
	            field_name = key.lower()
	            if field_name not in annotations or not value:
	                continue
	            if annotations[field_name] in [int, Optional[int]]:
	                try:
	                    value = int(value)
	                except ValueError as err:
	                    # Name the offending key so a bad .env entry is easy to find.
	                    raise ValueError(f"Invalid integer for {key} in {env_path}: {value!r}") from err
	            setattr(self, field_name, value)

	    def generate_env(self):
	        """Write the current values to ``.env``.

	        When the file already exists the user is asked on stdin whether to
	        override it; only the answer ``y`` (any case) triggers ``update_env``.
	        When it does not exist, one ``KEY=value`` line is written per attribute.
	        """
	        if os.path.exists(env_path):
	            log.info("%s already exists, do you want to override with the default configuration? (y/n)", env_path)
	            answer = input()
	            if answer.strip().lower() != "y":
	                return
	            self.update_env()
	        else:
	            with open(env_path, "w", encoding="utf-8") as f:
	                for k, v in self._as_env_dict().items():
	                    f.write(f"{k}={v}\n")
	            log.info("Generate %s successfully!", env_path)

	    def check_env(self):
	        """Append to ``.env`` every key that the file does not contain yet.

	        Keys that are already present keep whatever value the file holds.
	        """
	        env_config = dotenv_values(f"{env_path}")
	        for k, v in self._as_env_dict().items():
	            if k in env_config:
	                continue
	            log.info("Update %s: %s=%s", env_path, k, v)
	            set_key(env_path, k, v, quote_mode="never")

	    def update_env(self):
	        """Write to ``.env`` every key that is missing or whose value differs."""
	        env_config = dotenv_values(f"{env_path}")
	        for k, v in self._as_env_dict().items():
	            # .get() yields None for a missing key, which never equals a str,
	            # so missing and changed keys are handled by the same test.
	            if env_config.get(k) == v:
	                continue
	            log.info("Update %s: %s=%s", env_path, k, v)
	            set_key(env_path, k, v, quote_mode="never")


	class PromptConfig(PromptData):
	    """Prompt texts persisted in the YAML file at ``yaml_file_path``."""

	    # (YAML key == attribute name, indentation used for the block-scalar body)
	    _YAML_FIELDS = (
	        ("graph_schema", "  "),
	        ("extract_graph_prompt", "    "),
	        ("default_question", "    "),
	        ("custom_rerank_info", "    "),
	        ("answer_prompt", "    "),
	        ("keywords_extract_prompt", "    "),
	    )

	    def ensure_yaml_file_exists(self):
	        """Load the prompt YAML into this object, creating the file if absent.

	        Every top-level key found in the file is set as an attribute of the
	        same name.  An empty file yields no overrides.
	        """
	        if not os.path.exists(yaml_file_path):
	            # generate_yaml_file() logs the creation message itself.
	            self.generate_yaml_file()
	            return
	        with open(yaml_file_path, "r", encoding="utf-8") as file:
	            # safe_load returns None for an empty document.
	            data = yaml.safe_load(file) or {}
	        for key, value in data.items():
	            setattr(self, key, value)
	        log.info("Loading prompt file '%s' successfully.", F_NAME)

	    def save_to_yaml(self):
	        """Write all prompt fields to the YAML file as literal block scalars.

	        Each field becomes ``<key>: |`` followed by its text, every line
	        prefixed with the field's indentation, and then one blank line.
	        Extend ``_YAML_FIELDS`` to store additional fields.
	        """
	        sections = []
	        for key, indent in self._YAML_FIELDS:
	            body = "\n".join(f"{indent}{line}" for line in getattr(self, key).splitlines())
	            # A bare "|" is the YAML literal block-scalar indicator.
	            sections.append(f"{key}: |\n{body}\n\n")
	        with open(yaml_file_path, "w", encoding="utf-8") as file:
	            file.write("".join(sections))

	    def generate_yaml_file(self):
	        """Create the prompt YAML from the current values.

	        When the file already exists the user is asked on stdin whether to
	        override it; only the answer ``y`` (any case) rewrites the file.
	        """
	        if os.path.exists(yaml_file_path):
	            log.info("%s already exists, do you want to override with the default configuration? (y/n)", yaml_file_path)
	            answer = input()
	            if answer.strip().lower() != "y":
	                return
	            self.save_to_yaml()
	        else:
	            self.save_to_yaml()
	            log.info("Prompt file '%s' doesn't exist, create it.", yaml_file_path)

	    def update_yaml_file(self):
	        """Rewrite the prompt YAML unconditionally with the current values."""
	        self.save_to_yaml()
	        log.info("Prompt file '%s' updated successfully.", F_NAME)