Skip to content

Commit

Permalink
chore(indicatorrecord): Create all sourcing records refactor 1st prot…
Browse files Browse the repository at this point in the history
…otype
  • Loading branch information
KevSanchez committed Aug 30, 2022
1 parent 4cc5f31 commit c62d168
Show file tree
Hide file tree
Showing 3 changed files with 223 additions and 77 deletions.
Original file line number Diff line number Diff line change
Expand Up @@ -8,6 +8,7 @@ import { IndicatorsModule } from 'modules/indicators/indicators.module';
import { MaterialsModule } from 'modules/materials/materials.module';
import { SourcingRecordsModule } from 'modules/sourcing-records/sourcing-records.module';
import { CachedDataModule } from 'modules/cached-data/cached-data.module';
import { ImpactCalculatorService } from 'modules/indicator-records/services/impact-calculator.service';

@Module({
imports: [
Expand All @@ -19,7 +20,7 @@ import { CachedDataModule } from 'modules/cached-data/cached-data.module';
CachedDataModule,
],
controllers: [IndicatorRecordsController],
providers: [IndicatorRecordsService],
providers: [IndicatorRecordsService, ImpactCalculatorService],
exports: [IndicatorRecordsService],
})
export class IndicatorRecordsModule {}
Original file line number Diff line number Diff line change
Expand Up @@ -36,6 +36,7 @@ import {
CACHED_DATA_TYPE,
CachedData,
} from 'modules/cached-data/cached.data.entity';
import { ImpactCalculatorService } from 'modules/indicator-records/services/impact-calculator.service';

export interface CachedRawValue {
rawValue: number;
Expand All @@ -51,6 +52,7 @@ export class IndicatorRecordsService extends AppBaseService<
constructor(
@InjectRepository(IndicatorRecordRepository)
private readonly indicatorRecordRepository: IndicatorRecordRepository,
private readonly impactCalculatorService: ImpactCalculatorService,
private readonly indicatorService: IndicatorsService,
private readonly h3DataService: H3DataService,
private readonly materialsToH3sService: MaterialsToH3sService,
Expand Down
295 changes: 219 additions & 76 deletions api/src/modules/indicator-records/services/impact-calculator.service.ts
Original file line number Diff line number Diff line change
@@ -1,92 +1,230 @@
import { Connection, getConnection, QueryRunner, Repository, SelectQueryBuilder } from "typeorm";
import { Logger } from '@nestjs/common';
import {
Connection,
EntityRepository,
getConnection,
QueryRunner,
Repository,
SelectQueryBuilder,
} from 'typeorm';
import { Injectable, Logger } from '@nestjs/common';
import { SaveOptions } from 'typeorm/repository/SaveOptions';
import { MATERIAL_TO_H3_TYPE } from '../../materials/material-to-h3.entity';
import { MATERIAL_TO_H3_TYPE } from 'modules/materials/material-to-h3.entity';
import { H3DataService } from 'modules/h3-data/h3-data.service';
import { H3Data } from 'modules/h3-data/h3-data.entity';
import { INDICATOR_TYPES } from 'modules/indicators/indicator.entity';
import { SourcingRecordsWithIndicatorRawDataDto } from '../../sourcing-records/dto/sourcing-records-with-indicator-raw-data.dto';

export abstract class AppBaseRepository<Entity> extends Repository<Entity> {
@Injectable()
export class ImpactCalculatorService {
logger: Logger = new Logger(this.constructor.name);

async calculateImpact<Entity>(
georegionId: string,
materialH3Id: string,
materialType: MATERIAL_TO_H3_TYPE,
constructor(private readonly h3DataService: H3DataService) {}

async calculateImpact(
connection: Connection,
queryRunner: QueryRunner,
georegionId: string,
materialId: string,
year: number,
options?: SaveOptions,
): Promise<Entity[]> {
): Promise<any[]> {
// MAIN LOGIC

// STEPS
/**
* 1. Get material h3 data table and column name
* 1.1 For each year, get the closest available material h3 data
* 2. Get indicator h3 data table and column name
* 2.1 For each year, get the closest available material h3 data
** Look at how interventions impact calculus implements this.
*
* 2.1 Get deforestation indicator h3 data and column name (because this indicator needs to be crossed with this data)
*
* CRAZY IDEAZ:
* 1. We have 12 years to calculate impact: 2010-2022 (12 DB calls)
* 2. We have 3 available years to calculate impact: 2010, 2014, 2020
*
* Before performing any call, can we determine that Sourcing Records from 2010 to 2012 will use data of 2010
* from 2013 to 2017 will use data of 2014
* from 2018 to 2022 will use data of 2022
*
* Knowing this, can we calculate impacts for those years simultaneosly (arent we doing that now anyway?) in 3 DB CALLS
* instead of doing 12, each for one year?
*
* LONG STORY SHORT:
*
* Can we do as much calls as different h3 data tables we need to attack (in this case 3)
* instead of doing as much calls as years we have to calculate impact for(in this case 12)
*
*There's another problem; every indicator/material might not have data available for the same years, an indicator having
* data for 2010 and 2020, and another indicator for 2012 and 2017
* seems like the root of the problem might be pretty early in the process, when deciding what (or more likely when) data to use
* for calculations
* what are the possible strategies to calculate the gap years? shgould it be configurable AFTER deployment?
* closest? that might be resolved by copying columns on the H3 info table on the H3 import
* mean between the closest ones? that's more difficult, might be possible in the H3 import? but it would be something
* not configurable once deployed
*
*
*/

const materialH3s: Map<MATERIAL_TO_H3_TYPE, H3Data> =
await this.h3DataService.getAllMaterialH3sByClosestYear(materialId, year);
const indicatorH3s: Map<INDICATOR_TYPES, H3Data> =
await this.h3DataService.getIndicatorH3sByTypeAndClosestYear(
Object.values(INDICATOR_TYPES),
year,
);
const producerH3: H3Data = materialH3s.get(MATERIAL_TO_H3_TYPE.PRODUCER)!;
const harvestH3: H3Data = materialH3s.get(MATERIAL_TO_H3_TYPE.HARVEST)!;
const bioH3: H3Data = indicatorH3s.get(INDICATOR_TYPES.BIODIVERSITY_LOSS)!;
const deforestH3: H3Data = indicatorH3s.get(INDICATOR_TYPES.DEFORESTATION)!;
const carbonH3: H3Data = indicatorH3s.get(
INDICATOR_TYPES.CARBON_EMISSIONS,
)!;
const waterH3: H3Data = indicatorH3s.get(
INDICATOR_TYPES.UNSUSTAINABLE_WATER_USE,
)!;

const values: SelectQueryBuilder<unknown> = await connection
.createQueryBuilder()

.select(`sum( "harvestH3"."${harvestH3.h3columnName}" )`, 'harvestedArea')
.addSelect(
`sum( "producerH3"."${producerH3.h3columnName}" )`,
'production',
)
.addSelect(
`sum( "harvestH3"."${harvestH3.h3columnName}" * "deforestH3"."${deforestH3.h3columnName}" ` +
`* "bioH3"."${bioH3.h3columnName}" * (1/0.0001) )`,
'rawBiodiversity',
)
.addSelect(
`sum( "harvestH3"."${harvestH3.h3columnName}" * "deforestH3"."${deforestH3.h3columnName}" ` +
`* "carbonH3"."${carbonH3.h3columnName}")`,
'rawCarbon',
)
.addSelect(
`sum( "harvestH3"."${harvestH3.h3columnName}" * "deforestH3"."${deforestH3.h3columnName}" )`,
'rawDeforestation',
)
.addSelect(
`sum( "waterH3"."${waterH3.h3columnName}" * 0.001)`,
'rawWater',
)
.from(
`(select * from get_h3_uncompact_geo_region('${georegionId}', 6))`,
'geoRegion',
)
.innerJoin(
producerH3.h3tableName,
'producerH3',
`"producerH3".h3index = "geoRegion".h3index`,
)
.innerJoin(
harvestH3.h3tableName,
'harvestH3',
`"harvestH3".h3index = "geoRegion".h3index`,
)
.innerJoin(
bioH3.h3tableName,
'bioH3',
'"bioH3".h3index = "geoRegion".h3index',
)
.innerJoin(
carbonH3.h3tableName,
'carbonH3',
'"carbonH3".h3index = "geoRegion".h3index',
)
.innerJoin(
deforestH3.h3tableName,
'deforestH3',
'"deforestH3".h3index = "geoRegion".h3index',
)
.innerJoin(
waterH3.h3tableName,
'waterH3',
'"waterH3".h3index = "geoRegion".h3index',
);

const result: any = await queryRunner.query(values.getQuery());
if (!result.length)
this.logger.warn(
`Could not retrieve Sourcing Records with weighted indicator values`,
);
return result[0];
}

async calculateAllSourcingRecords(): Promise<
SourcingRecordsWithIndicatorRawDataDto[]
> {
const connection: Connection = getConnection();
const queryRunner: QueryRunner = connection.createQueryRunner();
await queryRunner.connect();
await queryRunner.startTransaction();
const result: Entity[][] = [];

let result: SourcingRecordsWithIndicatorRawDataDto[] = [];
try {
// MAIN LOGIC

// STEPS
/**
* 1. Get material h3 data table and column name
* 1.1 For each year, get the closest available material h3 data
* 2. Get indicator h3 data table and column name
* 2.1 For each year, get the closest available material h3 data
** Look at how interventions impact calculus implements this.
*
* 2.1 Get deforestation indicator h3 data and column name (because this indicator needs to be crossed with this data)
*
* CRAZY IDEAZ:
* 1. We have 12 years to calculate impact: 2010-2022 (12 DB calls)
* 2. We have 3 available years to calculate impact: 2010, 2014, 2020
*
* Before performing any call, can we determine that Sourcing Records from 2010 to 2012 will use data of 2010
* from 2013 to 2017 will use data of 2014
* from 2018 to 2022 will use data of 2022
*
* Knowing this, can we calculate impacts for those years simultaneosly (arent we doing that now anyway?) in 3 DB CALLS
* instead of doing 12, each for one year?
*
* LONG STORY SHORT:
*
* Can we do as much calls as different h3 data tables we need to attack (in this case 3)
* instead of doing as much calls as years we have to calculate impact for(in this case 12)
*
*
*
*/
let materialH3data: any;
let indictorH3Data: any;

const result: any = await this.createQueryBuilder().select([
'sr.id as "sourcingRecordId",\n sr.tonnage,\n sr.year,\n slwithmaterialh3data.id as "sourcingLocationId",\n slwithmaterialh3data.production,\n slwithmaterialh3data."harvestedArea",\n slwithmaterialh3data."rawDeforestation",\n slwithmaterialh3data."rawBiodiversity",\n slwithmaterialh3data."rawCarbon",\n slwithmaterialh3data."rawWater",\n slwithmaterialh3data."materialH3DataId"',
]).from((subQuery: SelectQueryBuilder<any> )=> subQuery.select(`sum()`)
.from(`get_h3_uncompact_geo_region($1, $2)`, 'geoRegion')
.innerJoin('$3', 'materialH3', `materialH3.h3index = geoRegion.h3index`)
const sourcingRecordsQuery: SelectQueryBuilder<unknown> = connection
.createQueryBuilder()
.select([
`sr.id as "sourcingRecordId",
sr.tonnage,
sr.year,
sl.id as "sourcingLocationId",
sl."materialId",
sl."geoRegionId",
mth."h3DataId" as "materialH3DataId"`,
])
.from('sourcing_records', 'sr')
.innerJoin('sourcing_location', 'sl', 'sl.id = sr."sourcingLocationId"')
.innerJoin(
'$4',
'bioDiversityh3',
'bioDiversityh3.h3index = geoRegion.h3index',
(subQuery: SelectQueryBuilder<any>) => {
return subQuery
.select('"materialId"')
.addSelect('"h3DataId"')
.from('material_to_h3', 'material_to_h3')
.where(`type='${MATERIAL_TO_H3_TYPE.HARVEST}'`);
},
'mth',
'mth."materialId" = sl."materialId"',
)
.innerJoin(
'$5',
'deforestationH3',
'deforestation.h3index = geoRegion.h3index',
);

// This
const data: any = await this.createQueryBuilder()
.select(`sum()`)
.from(`get_h3_uncompact_geo_region($1, $2)`, 'geoRegion')
.innerJoin('$3', 'materialH3', `materialH3.h3index = geoRegion.h3index`)
.innerJoin(
'$4',
'bioDiversityh3',
'bioDiversityh3.h3index = geoRegion.h3index',
)
.innerJoin(
'$5',
'deforestationH3',
'deforestation.h3index = geoRegion.h3index',
);
// commit transaction if every chunk was saved successfully
.where('sl."scenarioInterventionId" IS NULL')
.andWhere('sl."interventionType" IS NULL');

const sourcingRecords: any[] = await queryRunner.query(
sourcingRecordsQuery.getQuery(),
);
result = await Promise.all(
sourcingRecords.map(async (sourcingRecord: any) => {
const rawValues: any = await this.calculateImpact(
connection,
queryRunner,
sourcingRecord.geoRegionId,
sourcingRecord.materialId,
sourcingRecord.year,
);

return {
sourcingRecordId: sourcingRecord.sourcingRecordId,
tonnage: sourcingRecord.tonnage,
year: sourcingRecord.year,

sourcingLocationId: sourcingRecord.sourcingLocationId,
production: rawValues.production,
harvestedArea: rawValues.harvestedArea,

rawDeforestation: rawValues.rawDeforestation,
rawBiodiversity: rawValues.rawBiodiversity,
rawCarbon: rawValues.rawCarbon,
rawWater: rawValues.rawWater,

materialH3DataId: sourcingRecord.materialH3DataId,
};
}),
);

await queryRunner.commitTransaction();
} catch (err) {
// rollback changes before throwing error
Expand All @@ -96,6 +234,11 @@ export abstract class AppBaseRepository<Entity> extends Repository<Entity> {
// release query runner which is manually created
await queryRunner.release();
}
return result.flat();

if (!result.length) {
throw new Error('No raw impact data could be calculated');
}

return result;
}
}

0 comments on commit c62d168

Please sign in to comment.