Skip to content

Commit 7e105bc

Browse files
committed
NC | Lifecycle | Adjust expire/noncurrent state properties to GPFS flow
Signed-off-by: Romy <35330373+romayalon@users.noreply.github.com>
1 parent 947eb7f commit 7e105bc

File tree

1 file changed

+30
-14
lines changed

1 file changed

+30
-14
lines changed

src/manage_nsfs/nc_lifecycle.js

Lines changed: 30 additions & 14 deletions
Original file line numberDiff line numberDiff line change
@@ -47,6 +47,12 @@ const TIMED_OPS = Object.freeze({
4747
DELETE_MULTIPLE_OBJECTS: 'delete_multiple_objects'
4848
});
4949

50+
/**
51+
* @typedef {{
52+
* is_finished?: Boolean | Undefined,
53+
* expire?: { is_finished?: Boolean | Undefined, key_marker?: String | Undefined, candidates_file_offset?: number | undefined}
54+
* noncurrent?: { is_finished?: Boolean | Undefined, key_marker_versioned?: String | Undefined, version_id_marker?: String | Undefined }}} RuleState
55+
*/
5056

5157
class NCLifecycle {
5258
constructor(config_fs, options = {}) {
@@ -265,7 +271,7 @@ class NCLifecycle {
265271
if (candidates.delete_candidates?.length > 0) {
266272
const expiration = lifecycle_rule.expiration ? this._get_expiration_time(lifecycle_rule.expiration) : 0;
267273
const filter_func = this._build_lifecycle_filter({filter: lifecycle_rule.filter, expiration});
268-
274+
dbg.log0('process_rule: calling delete_multiple_objects, num of objects to be deleted', candidates.delete_candidates.length);
269275
const delete_res = await this._call_op_and_update_status({
270276
bucket_name,
271277
rule_id,
@@ -282,6 +288,7 @@ class NCLifecycle {
282288
}
283289

284290
if (candidates.abort_mpu_candidates?.length > 0) {
291+
// report the size of the list this branch actually processes (abort_mpu_candidates);
// delete_candidates may be undefined here and would throw on .length
dbg.log0('process_rule: calling delete_multiple_objects, num of mpu to be aborted', candidates.abort_mpu_candidates.length);
285292
await this._call_op_and_update_status({
286293
bucket_name,
287294
rule_id,
@@ -465,7 +472,7 @@ class NCLifecycle {
465472
* @returns {Promise<Object[]>}
466473
*/
467474
async get_candidates_by_expiration_rule_posix(lifecycle_rule, bucket_json, object_sdk) {
468-
const rule_state = this.lifecycle_run_status.buckets_statuses[bucket_json.name].rules_statuses[lifecycle_rule.id].state.expire;
475+
const rule_state = this._get_rule_state(bucket_json, lifecycle_rule).expire;
469476
if (rule_state.is_finished) return [];
470477
const expiration = this._get_expiration_time(lifecycle_rule.expiration);
471478
if (expiration < 0) return [];
@@ -520,7 +527,7 @@ class NCLifecycle {
520527
* @returns {Promise<Object[]>}
521528
*/
522529
async get_candidates_by_expiration_delete_marker_rule(lifecycle_rule, bucket_json, object_sdk, {versions_list}) {
523-
const rule_state = this.lifecycle_run_status.buckets_statuses[bucket_json.name].rules_statuses[lifecycle_rule.id].state.noncurrent;
530+
const rule_state = this._get_rule_state(bucket_json, lifecycle_rule).noncurrent;
524531
if (rule_state.is_finished) return [];
525532
if (!versions_list) {
526533
versions_list = await this.load_versions_list(object_sdk, lifecycle_rule, bucket_json, rule_state);
@@ -619,7 +626,7 @@ class NCLifecycle {
619626
* @returns {Promise<Object[]>}
620627
*/
621628
async get_candidates_by_noncurrent_version_expiration_rule(lifecycle_rule, bucket_json, object_sdk, {versions_list}) {
622-
const rule_state = this.lifecycle_run_status.buckets_statuses[bucket_json.name].rules_statuses[lifecycle_rule.id].state.noncurrent;
629+
const rule_state = this._get_rule_state(bucket_json, lifecycle_rule).noncurrent;
623630
if (rule_state.is_finished) return [];
624631

625632
if (!versions_list) {
@@ -965,7 +972,7 @@ class NCLifecycle {
965972
*/
966973
init_rule_status(bucket_name, rule_id) {
967974
this.lifecycle_run_status.buckets_statuses[bucket_name].rules_statuses[rule_id] ??= {};
968-
this.lifecycle_run_status.buckets_statuses[bucket_name].rules_statuses[rule_id].state ??= {expire: {}, noncurrent: {}};
975+
this.lifecycle_run_status.buckets_statuses[bucket_name].rules_statuses[rule_id].state ??= { expire: {}, noncurrent: {} };
969976
this.lifecycle_run_status.buckets_statuses[bucket_name].rules_statuses[rule_id].rule_process_times = {};
970977
this.lifecycle_run_status.buckets_statuses[bucket_name].rules_statuses[rule_id].rule_stats ??= {};
971978
return this.lifecycle_run_status.buckets_statuses[bucket_name].rules_statuses[rule_id];
@@ -977,7 +984,7 @@ class NCLifecycle {
977984
* @param {string} rule_id
978985
*/
979986
update_rule_status_is_finished(bucket_name, rule_id) {
980-
const rule_state = this.lifecycle_run_status.buckets_statuses[bucket_name].rules_statuses[rule_id].state;
987+
const rule_state = this._get_rule_state({ name: bucket_name }, { id: rule_id });
981988
rule_state.is_finished = (rule_state.expire.is_finished === undefined || rule_state.expire.is_finished === true) &&
982989
(rule_state.noncurrent.is_finished === undefined || rule_state.noncurrent.is_finished === true);
983990
}
@@ -1011,18 +1018,20 @@ class NCLifecycle {
10111018
* _set_rule_state sets the current rule state on the lifecycle run status
10121019
* @param {Object} bucket_json
10131020
* @param {*} lifecycle_rule
1014-
* @param {{is_finished?: Boolean | Undefined, candidates_file_offset?: number | undefined}} rule_state
1021+
* @param {RuleState} rule_state
10151022
* @returns {Void}
10161023
*/
10171024
_set_rule_state(bucket_json, lifecycle_rule, rule_state) {
1018-
this.lifecycle_run_status.buckets_statuses[bucket_json.name].rules_statuses[lifecycle_rule.id].state = rule_state;
1025+
const existing_state = this._get_rule_state(bucket_json, lifecycle_rule);
1026+
const new_state = { ...existing_state, ...rule_state };
1027+
this.lifecycle_run_status.buckets_statuses[bucket_json.name].rules_statuses[lifecycle_rule.id].state = new_state;
10191028
}
10201029

10211030
/**
10221031
* _get_rule_state gets the current rule state on the lifecycle run status
10231032
* @param {Object} bucket_json
10241033
* @param {*} lifecycle_rule
1025-
* @returns {{is_finished?: Boolean | Undefined, candidates_file_offset?: number | undefined}} rule_state
1034+
* @returns {RuleState}
10261035
*/
10271036
_get_rule_state(bucket_json, lifecycle_rule) {
10281037
return this.lifecycle_run_status.buckets_statuses[bucket_json.name].rules_statuses[lifecycle_rule.id].state;
@@ -1164,6 +1173,7 @@ class NCLifecycle {
11641173
for (const bucket_name of bucket_names) {
11651174
const bucket_json = await this.config_fs.get_bucket_by_name(bucket_name, config_fs_options);
11661175
const bucket_mount_point = this.find_mount_point_by_bucket_path(mount_point_to_policy_map, bucket_json.path);
1176+
if (!bucket_json.lifecycle_configuration_rules?.length) continue;
11671177
for (const lifecycle_rule of bucket_json.lifecycle_configuration_rules) {
11681178
// currently we support expiration (current version) only
11691179
if (lifecycle_rule.expiration) {
@@ -1377,22 +1387,28 @@ class NCLifecycle {
13771387
* 1.2.2. parse the key from the candidate line
13781388
* 1.2.3. push the key to the candidates array
13791389
* 2. if candidates file does not exist, we return without error because it's valid that no candidates found
1390+
* GAP - when supporting noncurrent rule, we should update the state type to noncurrent based on the candidates file path
13801391
* @param {Object} bucket_json
13811392
* @param {*} lifecycle_rule
13821393
* @param {String} rule_candidates_path
13831394
* @returns {Promise<Object[]>} parsed_candidates_array
13841395
*/
13851396
async parse_candidates_from_gpfs_ilm_policy(bucket_json, lifecycle_rule, rule_candidates_path) {
13861397
let reader;
1398+
const state_type = 'expire';
1399+
const rule_state = this._get_rule_state(bucket_json, lifecycle_rule)?.[state_type];
1400+
// rule_state is an object (or undefined) - inspect it so the log shows its fields instead of "[object Object]"
dbg.log2(`parse_candidates_from_gpfs_ilm_policy rule_state=${util.inspect(rule_state)} state_type=${state_type}, currently on gpfs ilm flow - we support only expiration rule`);
1401+
if (rule_state?.is_finished) return [];
1402+
const finished_state = { [state_type]: { is_finished: true, candidates_file_offset: undefined } };
1403+
13871404
try {
1388-
const rule_state = this._get_rule_state(bucket_json, lifecycle_rule);
13891405
dbg.log2(`parse_candidates_from_gpfs_ilm_policy bucket_name=${bucket_json.name}, rule_id ${lifecycle_rule.id}, existing rule_state=${util.inspect(rule_state)}`);
1390-
13911406
const parsed_candidates_array = [];
13921407
reader = new NewlineReader(this.non_gpfs_fs_context, rule_candidates_path, { lock: 'SHARED', read_file_offset: rule_state?.candidates_file_offset || 0 });
1408+
13931409
const [count, is_finished] = await reader.forEachFilePathEntry(async entry => {
13941410
if (parsed_candidates_array.length >= config.NC_LIFECYCLE_LIST_BATCH_SIZE) return false;
1395-
const cur_rule_state = { is_finished: false, candidates_file_offset: reader.next_line_file_offset };
1411+
const cur_rule_state = { [state_type]: { is_finished: false, candidates_file_offset: reader.next_line_file_offset } };
13961412
this._set_rule_state(bucket_json, lifecycle_rule, cur_rule_state);
13971413
const key = this._parse_key_from_line(entry, bucket_json);
13981414
// TODO - need to add etag, size, version_id
@@ -1402,14 +1418,14 @@ class NCLifecycle {
14021418
});
14031419

14041420
if (is_finished) {
1405-
this._set_rule_state(bucket_json, lifecycle_rule, { is_finished: true, candidates_file_offset: undefined });
1421+
this._set_rule_state(bucket_json, lifecycle_rule, finished_state);
14061422
}
14071423
dbg.log2(`parse_candidates_from_gpfs_ilm_policy: parsed_candidates_array ${util.inspect(parsed_candidates_array)}, rule_state=${util.inspect(rule_state)}, count=${count} is_finished=${is_finished}`);
14081424
return parsed_candidates_array;
14091425
} catch (err) {
14101426
if (err.code === 'ENOENT') {
14111427
dbg.log2(`parse_candidates_from_gpfs_ilm_policy ilm_candidates_file_exists does not exist, no candidates to delete`);
1412-
this._set_rule_state(bucket_json, lifecycle_rule, { is_finished: true, candidates_file_offset: undefined });
1428+
this._set_rule_state(bucket_json, lifecycle_rule, finished_state);
14131429
return;
14141430
}
14151431
dbg.error('parse_candidates_from_gpfs_ilm_policy: error', err);

0 commit comments

Comments
 (0)