Skip to content
This repository was archived by the owner on May 27, 2025. It is now read-only.

Commit 57e8664

Browse files
committed
refactor AzureClientManager code and update pytests
1 parent ba883dc commit 57e8664

27 files changed

+358
-59
lines changed

backend/manage-indexing-jobs.py

Lines changed: 1 addition & 1 deletion
Original file line number | Diff line number | Diff line change
@@ -17,9 +17,9 @@
1717
config,
1818
)
1919

20-
from src.api.azure_clients import AzureClientManager
2120
from src.logger.load_logger import load_pipeline_logger
2221
from src.typing.pipeline import PipelineJobState
22+
from src.utils.azure_clients import AzureClientManager
2323
from src.utils.common import sanitize_name
2424
from src.utils.pipeline import PipelineJob
2525

backend/src/api/data.py

Lines changed: 1 addition & 1 deletion
Original file line number | Diff line number | Diff line change
@@ -13,12 +13,12 @@
1313
UploadFile,
1414
)
1515

16-
from src.api.azure_clients import AzureClientManager
1716
from src.logger.load_logger import load_pipeline_logger
1817
from src.typing.models import (
1918
BaseResponse,
2019
StorageNameList,
2120
)
21+
from src.utils.azure_clients import AzureClientManager
2222
from src.utils.common import (
2323
delete_blob_container,
2424
delete_cosmos_container_item,

backend/src/api/graph.py

Lines changed: 1 addition & 1 deletion
Original file line number | Diff line number | Diff line change
@@ -7,8 +7,8 @@
77
)
88
from fastapi.responses import StreamingResponse
99

10-
from src.api.azure_clients import AzureClientManager
1110
from src.logger.load_logger import load_pipeline_logger
11+
from src.utils.azure_clients import AzureClientManager
1212
from src.utils.common import (
1313
sanitize_name,
1414
validate_index_file_exist,

backend/src/api/index.py

Lines changed: 1 addition & 1 deletion
Original file line number | Diff line number | Diff line change
@@ -18,14 +18,14 @@
1818
config as kubernetes_config,
1919
)
2020

21-
from src.api.azure_clients import AzureClientManager
2221
from src.logger.load_logger import load_pipeline_logger
2322
from src.typing.models import (
2423
BaseResponse,
2524
IndexNameList,
2625
IndexStatusResponse,
2726
)
2827
from src.typing.pipeline import PipelineJobState
28+
from src.utils.azure_clients import AzureClientManager
2929
from src.utils.common import (
3030
delete_blob_container,
3131
sanitize_name,

backend/src/api/prompt_tuning.py

Lines changed: 1 addition & 1 deletion
Original file line number | Diff line number | Diff line change
@@ -13,8 +13,8 @@
1313
)
1414
from graphrag.config.create_graphrag_config import create_graphrag_config
1515

16-
from src.api.azure_clients import AzureClientManager
1716
from src.logger.load_logger import load_pipeline_logger
17+
from src.utils.azure_clients import AzureClientManager
1818
from src.utils.common import sanitize_name
1919

2020
prompt_tuning_route = APIRouter(prefix="/index/config", tags=["Index Configuration"])

backend/src/api/query.py

Lines changed: 1 addition & 1 deletion
Original file line number | Diff line number | Diff line change
@@ -25,13 +25,13 @@
2525
VectorStoreSearchResult,
2626
)
2727

28-
from src.api.azure_clients import AzureClientManager
2928
from src.logger.load_logger import load_pipeline_logger
3029
from src.typing.models import (
3130
GraphRequest,
3231
GraphResponse,
3332
)
3433
from src.typing.pipeline import PipelineJobState
34+
from src.utils.azure_clients import AzureClientManager
3535
from src.utils.common import (
3636
get_df,
3737
sanitize_name,

backend/src/api/query_streaming.py

Lines changed: 1 addition & 1 deletion
Original file line number | Diff line number | Diff line change
@@ -21,10 +21,10 @@
2121
)
2222
from graphrag.config import create_graphrag_config
2323

24-
from src.api.azure_clients import AzureClientManager
2524
from src.api.query import _is_index_complete
2625
from src.logger.load_logger import load_pipeline_logger
2726
from src.typing.models import GraphRequest
27+
from src.utils.azure_clients import AzureClientManager
2828
from src.utils.common import (
2929
get_df,
3030
sanitize_name,

backend/src/api/source.py

Lines changed: 7 additions & 7 deletions
Original file line number | Diff line number | Diff line change
@@ -29,8 +29,8 @@
2929
COVARIATES_TABLE = "output/create_final_covariates.parquet"
3030
ENTITY_EMBEDDING_TABLE = "output/create_final_entities.parquet"
3131
RELATIONSHIPS_TABLE = "output/create_final_relationships.parquet"
32-
TEXT_UNITS_TABLE = "output/create_base_text_units.parquet"
33-
DOCUMENTS_TABLE = "output/create_base_documents.parquet"
32+
TEXT_UNITS_TABLE = "output/create_final_text_units.parquet"
33+
DOCUMENTS_TABLE = "output/create_final_documents.parquet"
3434

3535

3636
@source_route.get(
@@ -39,7 +39,7 @@
3939
response_model=ReportResponse,
4040
responses={200: {"model": ReportResponse}},
4141
)
42-
async def get_report_info(index_name: str, report_id: str):
42+
async def get_report_info(index_name: str, report_id: int):
4343
# check for existence of file the query relies on to validate the index is complete
4444
sanitized_index_name = sanitize_name(index_name)
4545
validate_index_file_exist(sanitized_index_name, COMMUNITY_REPORT_TABLE)
@@ -49,15 +49,15 @@ async def get_report_info(index_name: str, report_id: str):
4949
storage_options=pandas_storage_options(),
5050
)
5151
# check if report_id exists in the index
52-
if not report_table["community"].isin([report_id]).any():
52+
if not report_table["human_readable_id"].isin([report_id]).any():
5353
raise ValueError(f"Report '{report_id}' not found in index '{index_name}'.")
5454
# check if multiple reports with the same id exist (should not happen)
55-
if len(report_table.loc[report_table["community"] == report_id]) > 1:
55+
if len(report_table.loc[report_table["human_readable_id"] == report_id]) > 1:
5656
raise ValueError(
5757
f"Multiple reports with id '{report_id}' found in index '{index_name}'."
5858
)
5959
report_content = report_table.loc[
60-
report_table["community"] == report_id, "full_content"
60+
report_table["human_readable_id"] == report_id, "full_content_json"
6161
].to_numpy()[0]
6262
return ReportResponse(text=report_content)
6363
except Exception:
@@ -97,7 +97,7 @@ async def get_chunk_info(index_name: str, text_unit_id: str):
9797
text_units = text_units.explode("document_ids")
9898

9999
# verify that text_unit_id exists in the index
100-
if not text_units["chunk_id"].isin([text_unit_id]).any():
100+
if not text_units["human_readable_id"].isin([text_unit_id]).any():
101101
raise ValueError(
102102
f"Text unit '{text_unit_id}' not found in index '{index_name}'."
103103
)

backend/src/indexer/indexer.py

Lines changed: 1 addition & 1 deletion
Original file line number | Diff line number | Diff line change
@@ -13,12 +13,12 @@
1313
from graphrag.config.create_graphrag_config import create_graphrag_config
1414
from graphrag.index.create_pipeline_config import create_pipeline_config
1515

16-
from src.api.azure_clients import AzureClientManager
1716
from src.logger import (
1817
PipelineJobUpdater,
1918
load_pipeline_logger,
2019
)
2120
from src.typing.pipeline import PipelineJobState
21+
from src.utils.azure_clients import AzureClientManager
2222
from src.utils.common import sanitize_name
2323
from src.utils.pipeline import PipelineJob
2424

backend/src/logger/__init__.py

Lines changed: 0 additions & 2 deletions
Original file line number | Diff line number | Diff line change
@@ -6,7 +6,6 @@
66
)
77
from src.logger.console_workflow_callbacks import ConsoleWorkflowCallbacks
88
from src.logger.load_logger import load_pipeline_logger
9-
from src.logger.logger_singleton import LoggerSingleton
109
from src.logger.pipeline_job_updater import PipelineJobUpdater
1110
from src.logger.typing import (
1211
Logger,
@@ -18,7 +17,6 @@
1817
"Logger",
1918
"ApplicationInsightsWorkflowCallbacks",
2019
"ConsoleWorkflowCallbacks",
21-
"LoggerSingleton",
2220
"PipelineAppInsightsReportingConfig",
2321
"PipelineJobUpdater",
2422
"PipelineReportingConfigTypes",

0 commit comments

Comments
 (0)