Files
DiunaBI/DiunaBI.Plugins.Morska/Processors/MorskaT1R3Processor.cs

476 lines
17 KiB
C#
Raw Normal View History

using System.Globalization;
using System.Text.RegularExpressions;
2025-11-05 20:50:25 +01:00
using DiunaBI.Domain.Entities;
using DiunaBI.Infrastructure.Data;
2025-12-02 21:24:37 +01:00
using DiunaBI.Infrastructure.Plugins;
2025-11-05 20:50:25 +01:00
using DiunaBI.Infrastructure.Services;
using Google.Apis.Sheets.v4;
using Google.Apis.Sheets.v4.Data;
using Microsoft.EntityFrameworkCore;
2025-06-02 18:53:25 +02:00
using Microsoft.Extensions.Logging;
namespace DiunaBI.Plugins.Morska.Processors;
2025-12-02 21:24:37 +01:00
public class MorskaT1R3Processor : BaseDataProcessor
2025-06-02 16:54:33 +02:00
{
2025-06-07 16:34:36 +02:00
/// <summary>Type identifier reported by this processor.</summary>
public override string ProcessorType
{
    get { return "Morska.Process.T1.R3"; }
}

/// <summary>Database context used to query layers and records and to persist results.</summary>
private readonly AppDbContext _db;

/// <summary>Google Sheets values resource used to read code columns and write report cells.</summary>
private readonly SpreadsheetsResource.ValuesResource _googleSheetValues;

/// <summary>Logger used for all diagnostics emitted by this processor.</summary>
private readonly ILogger<MorskaT1R3Processor> _logger;

// Configuration properties loaded from layer records

/// <summary>Value of the "Year" configuration record, set by LoadConfiguration.</summary>
private int Year { get; set; }

/// <summary>Value of the "Source" configuration record, set by LoadConfiguration.</summary>
private string? Source { get; set; }
2025-06-08 10:56:20 +02:00
/// <summary>
/// Creates the processor and stores the supplied collaborators for later use.
/// </summary>
/// <param name="db">Database context used for layer and record access.</param>
/// <param name="googleSheetValues">Google Sheets values resource used for the report update.</param>
/// <param name="logger">Logger for diagnostics.</param>
public MorskaT1R3Processor(
    AppDbContext db,
    SpreadsheetsResource.ValuesResource googleSheetValues,
    ILogger<MorskaT1R3Processor> logger)
{
    (_db, _googleSheetValues, _logger) = (db, googleSheetValues, logger);
}
2025-06-07 13:51:27 +02:00
2025-06-02 16:54:33 +02:00
/// <summary>
/// Runs the processor for the given worker layer: loads its configuration,
/// validates it and then performs the processing.
/// </summary>
/// <param name="processWorker">Worker layer whose records carry the configuration.</param>
/// <remarks>
/// Any exception raised by one of the steps is logged together with the worker's
/// name and id and then rethrown unchanged.
/// </remarks>
public override void Process(Layer processWorker)
{
    try
    {
        _logger.LogInformation(
            "{ProcessorType}: Starting processing for {ProcessWorkerName} ({ProcessWorkerId})",
            ProcessorType,
            processWorker.Name,
            processWorker.Id);

        // The three steps must run in this order: configuration is read first,
        // checked second, and only then used by the processing itself.
        LoadConfiguration(processWorker);
        ValidateConfiguration();
        PerformProcessing(processWorker);

        _logger.LogInformation(
            "{ProcessorType}: Successfully completed processing for {ProcessWorkerName}",
            ProcessorType,
            processWorker.Name);
    }
    catch (Exception e)
    {
        _logger.LogError(
            e,
            "{ProcessorType}: Failed to process {ProcessWorkerName} ({ProcessWorkerId})",
            ProcessorType,
            processWorker.Name,
            processWorker.Id);
        throw;
    }
}
/// <summary>
/// Reads the "Year" and "Source" configuration records of the worker layer
/// into the <c>Year</c> and <c>Source</c> properties.
/// </summary>
/// <param name="processWorker">Worker layer holding the configuration records.</param>
/// <exception cref="InvalidOperationException">
/// The layer has no records, the "Year" record is missing or not an integer,
/// or the "Source" record is missing or empty.
/// </exception>
private void LoadConfiguration(Layer processWorker)
{
    var records = processWorker.Records
        ?? throw new InvalidOperationException("ProcessWorker has no records");

    // Load year. The value is machine-readable configuration, so it is parsed
    // with the invariant culture instead of whatever culture the host runs under.
    var yearStr = GetRecordValue(records, "Year");
    if (string.IsNullOrEmpty(yearStr)
        || !int.TryParse(yearStr, NumberStyles.Integer, CultureInfo.InvariantCulture, out var year))
    {
        throw new InvalidOperationException("Year record not found or invalid");
    }

    Year = year;

    // Load source
    Source = GetRecordValue(records, "Source");
    if (string.IsNullOrEmpty(Source))
    {
        throw new InvalidOperationException("Source record not found");
    }

    _logger.LogDebug("{ProcessorType}: Configuration loaded - Year: {Year}, Source: {Source}",
        ProcessorType, Year, Source);
}
/// <summary>
/// Checks the loaded configuration: the year must lie in 2000..3000 and the
/// source must be non-empty.
/// </summary>
/// <exception cref="InvalidOperationException">
/// One or more checks failed; the message lists every failure, comma-separated.
/// </exception>
private void ValidateConfiguration()
{
    var problems = new List<string>();

    if (Year is < 2000 or > 3000)
    {
        problems.Add($"Invalid year: {Year}");
    }

    if (string.IsNullOrEmpty(Source))
    {
        problems.Add("Source is required");
    }

    if (problems.Count > 0)
    {
        var details = string.Join(", ", problems);
        throw new InvalidOperationException($"Configuration validation failed: {details}");
    }

    _logger.LogDebug("{ProcessorType}: Configuration validation passed", ProcessorType);
}
/// <summary>
/// Executes the processing pipeline: resolves the target layer, collects the
/// source layers, derives the new records, persists them and finally refreshes
/// the Google Sheet report.
/// </summary>
/// <param name="processWorker">Worker layer that owns the processed layer.</param>
private void PerformProcessing(Layer processWorker)
{
    _logger.LogDebug(
        "{ProcessorType}: Processing data for Year: {Year}, Source: {Source}",
        ProcessorType,
        Year,
        Source);

    // Target layer is resolved before the sources are queried.
    var targetLayer = GetOrCreateProcessedLayer(processWorker);

    // Collect source layers and derive the output records from them.
    var sourceLayers = GetDataSources();
    var generatedRecords = ProcessRecords(sourceLayers);

    // Persist first; the report update re-reads the layer from the database.
    SaveProcessedLayer(targetLayer, generatedRecords);
    UpdateGoogleSheetReport(targetLayer.Id);

    _logger.LogInformation(
        "{ProcessorType}: Successfully processed {RecordCount} records for layer {LayerName} ({LayerId})",
        ProcessorType,
        generatedRecords.Count,
        targetLayer.Name,
        targetLayer.Id);
}
/// <summary>
/// Returns the most recently created, non-deleted and non-cancelled child layer
/// of the worker, or builds a new processed layer when none exists.
/// </summary>
/// <param name="processWorker">Worker layer whose child is looked up.</param>
/// <returns>
/// The existing layer with refreshed modification audit fields, or a new layer
/// instance that has not yet been added to the database context.
/// </returns>
private Layer GetOrCreateProcessedLayer(Layer processWorker)
{
    // Hard-coded user id written to the audit fields; parsed once per call.
    var auditUserId = Guid.Parse("F392209E-123E-4651-A5A4-0B1D6CF9FF9D");

    // One clock read so CreatedAt and ModifiedAt of a new layer are identical.
    var now = DateTime.UtcNow;

    var processedLayer = _db.Layers
        .Where(x => x.ParentId == processWorker.Id && !x.IsDeleted && !x.IsCancelled)
        .OrderByDescending(x => x.CreatedAt)
        .FirstOrDefault();

    if (processedLayer != null)
    {
        processedLayer.ModifiedById = auditUserId;
        processedLayer.ModifiedAt = now;

        _logger.LogDebug("{ProcessorType}: Using existing processed layer {LayerName}",
            ProcessorType, processedLayer.Name);

        return processedLayer;
    }

    // NOTE(review): Count() + 1 can repeat a number if layers are ever physically
    // removed or two processors run concurrently - confirm this is acceptable.
    var number = _db.Layers.Count() + 1;

    processedLayer = new Layer
    {
        Id = Guid.NewGuid(),
        Type = LayerType.Processed,
        ParentId = processWorker.Id,
        Number = number,
        Name = $"L{number}-P-{Year}-R3-T1",
        CreatedById = auditUserId,
        ModifiedById = auditUserId,
        CreatedAt = now,
        ModifiedAt = now
    };

    _logger.LogDebug("{ProcessorType}: Created new processed layer {LayerName}",
        ProcessorType, processedLayer.Name);

    return processedLayer;
}
2025-06-07 13:51:27 +02:00
/// <summary>
/// Finds the source layers whose name matches
/// <c>L&lt;number&gt;-P-&lt;Year&gt;/&lt;number&gt;-&lt;Source&gt;-T5</c> and loads them
/// together with their records.
/// </summary>
/// <returns>The matching layers, untracked, with records included.</returns>
/// <exception cref="InvalidOperationException">No layer matches the pattern.</exception>
private List<Layer> GetDataSources()
{
    // Source is configuration text, so it is escaped to be matched literally;
    // otherwise characters such as '.' or '+' would act as regex operators.
    string pattern = @$"^L\d+-P-{Year}/\d+-{Regex.Escape(Source ?? string.Empty)}-T5$";
    var nameRegex = new Regex(pattern);

    // Step 1: fetch only ids and names. The regex cannot be evaluated by the
    // database, but there is no need to pull every layer's records into memory
    // just to test its name. Layers without a name can never match.
    var matchingIds = _db.Layers
        .AsNoTracking()
        .Where(x => !x.IsDeleted && !x.IsCancelled && x.Name != null)
        .Select(x => new { x.Id, x.Name })
        .AsEnumerable()
        .Where(x => nameRegex.IsMatch(x.Name!))
        .Select(x => x.Id)
        .ToList();

    // Step 2: load records only for the layers that actually matched.
    var dataSources = matchingIds.Count == 0
        ? new List<Layer>()
        : _db.Layers
            .Where(x => matchingIds.Contains(x.Id))
            .Include(layer => layer.Records!)
            .AsNoTracking()
            .ToList();

    if (dataSources.Count == 0)
    {
        throw new InvalidOperationException($"No data sources found for pattern: {pattern}");
    }

    _logger.LogDebug("{ProcessorType}: Found {DataSourceCount} data sources matching pattern {Pattern}",
        ProcessorType, dataSources.Count, pattern);

    return dataSources;
}
/// <summary>
/// Derives output records from every source layer whose name yields a month.
/// </summary>
/// <param name="dataSources">Source layers with their records loaded.</param>
/// <returns>All records produced from the usable source layers.</returns>
/// <remarks>
/// A layer whose name gives no parseable month is logged as a warning and skipped.
/// </remarks>
private List<Record> ProcessRecords(List<Layer> dataSources)
{
    var collected = new List<Record>();

    foreach (var layer in dataSources)
    {
        var monthText = ProcessHelper.ExtractMonthFromLayerName(layer.Name!);

        if (monthText != null && int.TryParse(monthText, out var month))
        {
            _logger.LogDebug(
                "{ProcessorType}: Processing data source {LayerName} for month {Month}",
                ProcessorType,
                layer.Name,
                month);

            var produced = ProcessDataSourceRecords(layer, month);
            collected.AddRange(produced);

            _logger.LogDebug(
                "{ProcessorType}: Processed {RecordCount} records from source {LayerName}",
                ProcessorType,
                produced.Count,
                layer.Name);
        }
        else
        {
            _logger.LogWarning(
                "{ProcessorType}: Could not extract month from layer name: {LayerName}",
                ProcessorType,
                layer.Name);
        }
    }

    _logger.LogDebug(
        "{ProcessorType}: Total processed records: {TotalRecordCount}",
        ProcessorType,
        collected.Count);

    return collected;
}
/// <summary>
/// Expands each record of a source layer into one output record per populated
/// value position (1-32).
/// </summary>
/// <param name="dataSource">Source layer; its records must be loaded.</param>
/// <param name="month">Month number embedded into each generated record code.</param>
/// <returns>
/// New records coded <c>&lt;source code&gt;&lt;month:2&gt;&lt;position:2&gt;</c>. Position 1
/// carries the source record's Value1 unchanged; every other position carries
/// Value1 multiplied by that position's value and divided by 100. Desc1 is copied
/// from the source record.
/// </returns>
private List<Record> ProcessDataSourceRecords(Layer dataSource, int month)
{
    var newRecords = new List<Record>();

    foreach (var record in dataSource.Records!)
    {
        if (record.Value1 == null)
        {
            _logger.LogDebug("{ProcessorType}: Skipping record {RecordCode} - Value1 is null",
                ProcessorType, record.Code);
            continue;
        }

        // Process values for positions 1-32
        for (var i = 1; i < 33; i++)
        {
            var value = ProcessHelper.GetValue(record, i);
            if (value == null)
            {
                continue;
            }

            var baseValue = (double)record.Value1!;
            var positionValue = (double)value;

            // Position 1 is the base amount itself; the remaining positions are
            // applied to the base as a percentage.
            var calculatedValue = i == 1 ? baseValue : baseValue * positionValue / 100;

            var newRecord = new Record
            {
                Id = Guid.NewGuid(),
                Code = $"{record.Code}{month:D2}{i:D2}",
                CreatedAt = DateTime.UtcNow,
                ModifiedAt = DateTime.UtcNow,
                Value1 = calculatedValue,
                Desc1 = record.Desc1
            };
            newRecords.Add(newRecord);

            _logger.LogDebug("{ProcessorType}: Created record {NewRecordCode} with value {Value} from {OriginalCode}",
                ProcessorType, newRecord.Code, newRecord.Value1, record.Code);
        }
    }

    return newRecords;
}
/// <summary>
/// Persists the processed layer and replaces its records with the new set.
/// </summary>
/// <param name="processedLayer">Layer to insert or update.</param>
/// <param name="newRecords">Records that become the layer's content.</param>
/// <remarks>
/// The layer is added when no row with its id exists yet and updated otherwise.
/// All changes are written with a single SaveChanges call.
/// </remarks>
private void SaveProcessedLayer(Layer processedLayer, List<Record> newRecords)
{
    bool alreadyPersisted = _db.Layers.Any(x => x.Id == processedLayer.Id);

    if (alreadyPersisted)
    {
        _db.Layers.Update(processedLayer);
        _logger.LogDebug("{ProcessorType}: Updated existing processed layer in database", ProcessorType);
    }
    else
    {
        _db.Layers.Add(processedLayer);
        _logger.LogDebug("{ProcessorType}: Added new processed layer to database", ProcessorType);
    }

    // Record changes are staged on the same context and flushed together with the layer.
    SaveRecords(processedLayer.Id, newRecords);
    _db.SaveChanges();

    _logger.LogDebug(
        "{ProcessorType}: Saved {RecordCount} records for layer {LayerId}",
        ProcessorType,
        newRecords.Count,
        processedLayer.Id);
}
2025-06-02 18:53:25 +02:00
/// <summary>
/// Stages the replacement of a layer's records: existing records are marked for
/// removal and the supplied ones are stamped with audit fields and added.
/// </summary>
/// <param name="layerId">Id of the layer that owns the records.</param>
/// <param name="records">Records to attach to the layer.</param>
/// <remarks>This method does not call SaveChanges; it only stages changes on the context.</remarks>
private void SaveRecords(Guid layerId, ICollection<Record> records)
{
    // Remove existing records for this layer
    var toDelete = _db.Records.Where(x => x.LayerId == layerId).ToList();
    if (toDelete.Count > 0)
    {
        _db.Records.RemoveRange(toDelete);
        _logger.LogDebug("{ProcessorType}: Removed {DeletedCount} existing records for layer {LayerId}",
            ProcessorType, toDelete.Count, layerId);
    }

    // The audit user id and timestamp do not vary per record, so they are
    // computed once; every record in the batch gets the same stamp.
    var auditUserId = Guid.Parse("F392209E-123E-4651-A5A4-0B1D6CF9FF9D");
    var now = DateTime.UtcNow;

    // Add new records
    foreach (var record in records)
    {
        record.CreatedById = auditUserId;
        record.CreatedAt = now;
        record.ModifiedById = auditUserId;
        record.ModifiedAt = now;
        record.LayerId = layerId;
    }

    _db.Records.AddRange(records);

    _logger.LogDebug("{ProcessorType}: Added {RecordCount} new records for layer {LayerId}",
        ProcessorType, records.Count, layerId);
}
2025-06-07 13:51:27 +02:00
/// <summary>
/// Re-reads the processed layer with its records and writes it to the monthly
/// sheets of the report spreadsheet, one month at a time.
/// </summary>
/// <param name="sourceId">Id of the processed layer to report.</param>
/// <exception cref="InvalidOperationException">The layer cannot be found.</exception>
/// <remarks>Failures are logged with the layer id and rethrown.</remarks>
private void UpdateGoogleSheetReport(Guid sourceId)
{
    try
    {
        _logger.LogDebug(
            "{ProcessorType}: Starting Google Sheet report update for layer {LayerId}",
            ProcessorType,
            sourceId);

        const string sheetId = "10Xo8BBF92nM7_JzzeOuWp49Gz8OsYuCxLDOeChqpW_8";

        var reportLayer = _db.Layers
            .Include(x => x.Records)
            .AsNoTracking()
            .FirstOrDefault(x => x.Id == sourceId);

        if (reportLayer is null)
        {
            throw new InvalidOperationException($"Processed layer {sourceId} not found");
        }

        // Update sheets for all months, pausing one second after each sheet.
        foreach (var month in Enumerable.Range(1, 12))
        {
            UpdateMonthSheet(sheetId, reportLayer, month);
            Thread.Sleep(1000);
        }

        _logger.LogInformation(
            "{ProcessorType}: Successfully updated Google Sheet reports for all months",
            ProcessorType);
    }
    catch (Exception e)
    {
        _logger.LogError(
            e,
            "{ProcessorType}: Failed to update Google Sheet report for layer {LayerId}",
            ProcessorType,
            sourceId);
        throw;
    }
}
/// <summary>
/// Updates the sheet belonging to one month: reads the code column, writes the
/// matching values and then writes the timestamps.
/// </summary>
/// <param name="sheetId">Spreadsheet id.</param>
/// <param name="processedLayer">Processed layer with its records loaded.</param>
/// <param name="month">Month number of the sheet to update.</param>
/// <remarks>
/// If the code column cannot be read, or holds no values, a warning is logged
/// and the sheet is skipped. Any other failure is logged and rethrown.
/// </remarks>
private void UpdateMonthSheet(string sheetId, Layer processedLayer, int month)
{
    var sheetName = ProcessHelper.GetSheetName(month, Year);

    try
    {
        _logger.LogDebug(
            "{ProcessorType}: Updating sheet {SheetName} for month {Month}",
            ProcessorType,
            sheetName,
            month);

        // Get codes from sheet; a failed read skips this sheet instead of
        // aborting the whole report.
        IList<IList<object>>? codeRows;
        try
        {
            var codeRange = $"{sheetName}!A7:A200";
            codeRows = _googleSheetValues.Get(sheetId, codeRange).Execute()?.Values;
        }
        catch (Exception readError)
        {
            _logger.LogWarning(
                "{ProcessorType}: Sheet {SheetName} not accessible, skipping - {Error}",
                ProcessorType,
                sheetName,
                readError.Message);
            return;
        }

        if (codeRows == null)
        {
            _logger.LogWarning(
                "{ProcessorType}: No data found in sheet {SheetName}, skipping",
                ProcessorType,
                sheetName);
            return;
        }

        // Update data, then timestamps
        UpdateSheetData(sheetId, sheetName, processedLayer, codeRows, month);
        UpdateSheetTimestamps(sheetId, sheetName, processedLayer);

        _logger.LogDebug(
            "{ProcessorType}: Successfully updated sheet {SheetName}",
            ProcessorType,
            sheetName);
    }
    catch (Exception e)
    {
        _logger.LogError(
            e,
            "{ProcessorType}: Failed to update sheet {SheetName} for month {Month}",
            ProcessorType,
            sheetName,
            month);
        throw;
    }
}
/// <summary>
/// Writes the values of one month into range C7:R200 of the given sheet, one
/// output row per code row read from column A.
/// </summary>
/// <param name="sheetId">Spreadsheet id.</param>
/// <param name="sheetName">Name of the sheet (tab) to write to.</param>
/// <param name="processedLayer">Processed layer with its records loaded.</param>
/// <param name="codeRows">Rows read from the code column, in sheet order.</param>
/// <param name="month">Month number used to build the record codes.</param>
/// <remarks>
/// For each code, positions 1-15 are looked up as
/// <c>&lt;code&gt;&lt;month:2&gt;&lt;position:2&gt;</c>; a missing value is written as an
/// empty string. The 16th cell receives the Desc1 of the matching records.
/// </remarks>
private void UpdateSheetData(string sheetId, string sheetName, Layer processedLayer, IList<IList<object>> codeRows, int month)
{
    const int positionCount = 15;

    // Index records by code once instead of scanning the whole collection for
    // every cell. TryAdd keeps the first record per code, which is what a
    // FirstOrDefault scan would have returned.
    var recordsByCode = new Dictionary<string, Record>();
    foreach (var record in processedLayer.Records!)
    {
        if (record.Code != null)
        {
            recordsByCode.TryAdd(record.Code, record);
        }
    }

    var updateValueRange = new ValueRange
    {
        Values = new List<IList<object>>()
    };

    foreach (var row in codeRows)
    {
        if (row.Count == 0)
        {
            // A blank code row must still occupy a row in the output. Dropping it
            // would shift every following row up and write values next to the
            // wrong codes. An empty row writes no cells.
            updateValueRange.Values.Add(new List<object>());
            continue;
        }

        var code = row[0].ToString();
        var updateRow = new List<object>(positionCount + 1);
        var department = "";

        // Process columns C to Q (positions 1-15)
        for (var position = 1; position <= positionCount; position++)
        {
            var recordCode = $"{code}{month:D2}{position:D2}";
            recordsByCode.TryGetValue(recordCode, out var codeRecord);

            if (codeRecord?.Value1 != null)
            {
                updateRow.Add(codeRecord.Value1);
                _logger.LogDebug("{ProcessorType}: Found value {Value} for code {RecordCode}",
                    ProcessorType, codeRecord.Value1, recordCode);
            }
            else
            {
                updateRow.Add("");
            }

            // Only a non-empty description replaces the current one, so a missing
            // record at a later position no longer blanks the department.
            var description = codeRecord?.Desc1;
            if (!string.IsNullOrEmpty(description))
            {
                department = description;
            }
        }

        // Column R
        updateRow.Add(department);
        updateValueRange.Values.Add(updateRow);
    }

    // Update sheet with new values
    var update = _googleSheetValues.Update(updateValueRange, sheetId, $"{sheetName}!C7:R200");
    update.ValueInputOption = SpreadsheetsResource.ValuesResource.UpdateRequest.ValueInputOptionEnum.USERENTERED;
    update.Execute();

    _logger.LogDebug("{ProcessorType}: Updated {RowCount} rows of data in sheet {SheetName}",
        ProcessorType, updateValueRange.Values.Count, sheetName);
}
/// <summary>
/// Writes the layer's modification time into cells G1 (UTC) and G2 (Warsaw
/// local time) of the given sheet.
/// </summary>
/// <param name="sheetId">Spreadsheet id.</param>
/// <param name="sheetName">Name of the sheet (tab) to write to.</param>
/// <param name="processedLayer">Layer whose ModifiedAt is reported.</param>
private void UpdateSheetTimestamps(string sheetId, string sheetName, Layer processedLayer)
{
    const string timestampFormat = "dd.MM.yyyy HH:mm:ss";
    var polishCulture = CultureInfo.GetCultureInfo("pl-PL");

    // This class always stores ModifiedAt from DateTime.UtcNow, but a value read
    // back from the database may have Kind == Unspecified. ToUniversalTime()
    // would treat such a value as local time and shift it, so an unspecified
    // kind is tagged as UTC instead. Both strings derive from this one value.
    var modifiedAt = processedLayer.ModifiedAt;
    var modifiedUtc = modifiedAt.Kind == DateTimeKind.Unspecified
        ? DateTime.SpecifyKind(modifiedAt, DateTimeKind.Utc)
        : modifiedAt.ToUniversalTime();

    var timeUtc = modifiedUtc.ToString(timestampFormat, polishCulture);

    // NOTE(review): this is a Windows time zone id; resolving it on non-Windows
    // hosts depends on the runtime's id conversion support - confirm for the
    // deployment target.
    var warsawTimeZone = TimeZoneInfo.FindSystemTimeZoneById("Central European Standard Time");
    var warsawTime = TimeZoneInfo.ConvertTimeFromUtc(modifiedUtc, warsawTimeZone);
    var timeWarsaw = warsawTime.ToString(timestampFormat, polishCulture);

    var valueRangeTime = new ValueRange
    {
        Values = new List<IList<object>>
        {
            new List<object> { timeUtc },
            new List<object> { timeWarsaw }
        }
    };

    var updateTime = _googleSheetValues.Update(valueRangeTime, sheetId, $"{sheetName}!G1:G2");
    updateTime.ValueInputOption = SpreadsheetsResource.ValuesResource.UpdateRequest.ValueInputOptionEnum.USERENTERED;
    updateTime.Execute();

    _logger.LogDebug("{ProcessorType}: Updated timestamps in sheet {SheetName} - UTC: {TimeUtc}, Warsaw: {TimeWarsaw}",
        ProcessorType, sheetName, timeUtc, timeWarsaw);
}
/// <summary>
/// Returns the Desc1 of the first record whose Code equals <paramref name="code"/>.
/// </summary>
/// <param name="records">Records to search.</param>
/// <param name="code">Code to look for.</param>
/// <returns>The matching record's Desc1, or <c>null</c> when no record matches.</returns>
private string? GetRecordValue(ICollection<Record> records, string code)
{
    foreach (var candidate in records)
    {
        if (candidate.Code == code)
        {
            return candidate.Desc1;
        }
    }

    return null;
}
}