Browse Source

CLDC-2369 Spreadsheet dupe (#1663)

* remove dead code

* handle spreadsheet dupes in lettings

* handle spreadsheet dupes in sales

* update error message

* use feature flag
pull/1688/head
Phil Lee 2 years ago committed by GitHub
parent
commit
c5842122d7
No known key found for this signature in database
GPG Key ID: 4AEE18F83AFDEB23
  1. 32
      app/services/bulk_upload/lettings/validator.rb
  2. 23
      app/services/bulk_upload/lettings/year2022/row_parser.rb
  3. 23
      app/services/bulk_upload/lettings/year2023/row_parser.rb
  4. 1
      app/services/bulk_upload/sales/log_creator.rb
  5. 19
      app/services/bulk_upload/sales/validator.rb
  6. 21
      app/services/bulk_upload/sales/year2022/row_parser.rb
  7. 21
      app/services/bulk_upload/sales/year2023/row_parser.rb
  8. 11
      config/locales/en.yml
  9. 1
      spec/factories/sales_log.rb
  10. 17
      spec/services/bulk_upload/lettings/validator_spec.rb
  11. 12
      spec/services/bulk_upload/lettings/year2022/row_parser_spec.rb
  12. 12
      spec/services/bulk_upload/lettings/year2023/row_parser_spec.rb
  13. 16
      spec/services/bulk_upload/sales/validator_spec.rb
  14. 12
      spec/services/bulk_upload/sales/year2022/row_parser_spec.rb
  15. 12
      spec/services/bulk_upload/sales/year2023/row_parser_spec.rb
  16. 2
      spec/services/csv/sales_log_csv_service_spec.rb

32
app/services/bulk_upload/lettings/validator.rb

@ -1,5 +1,3 @@
require "csv"
class BulkUpload::Lettings::Validator class BulkUpload::Lettings::Validator
include ActiveModel::Validations include ActiveModel::Validations
@ -16,9 +14,11 @@ class BulkUpload::Lettings::Validator
end end
def call def call
row_parsers.each_with_index do |row_parser, index| row_parsers.each(&:valid?)
row_parser.valid?
validate_duplicate_rows if FeatureToggle.bulk_upload_duplicate_log_check_enabled?
row_parsers.each_with_index do |row_parser, index|
row = index + row_offset + 1 row = index + row_offset + 1
row_parser.errors.each do |error| row_parser.errors.each do |error|
@ -69,25 +69,25 @@ class BulkUpload::Lettings::Validator
errors.count == errors.where(category: "soft_validation").count && errors.count.positive? errors.count == errors.where(category: "soft_validation").count && errors.count.positive?
end end
def over_column_error_threshold? def any_logs_already_exist?
fields = ("field_1".."field_134").to_a row_parsers.any?(&:log_already_exists?)
percentage_threshold = (row_parsers.size * COLUMN_PERCENTAGE_ERROR_THRESHOLD).ceil end
fields.any? do |field| private
count = row_parsers.count { |row_parser| row_parser.errors[field].present? }
next if count < COLUMN_ABSOLUTE_ERROR_THRESHOLD # n^2 algo
def validate_duplicate_rows
row_parsers.each do |rp|
dupe = row_parsers.reject { |r| r.object_id.equal?(rp.object_id) }.any? do |rp_counter|
rp.spreadsheet_duplicate_hash == rp_counter.spreadsheet_duplicate_hash
end
count > percentage_threshold if dupe
rp.add_duplicate_found_in_spreadsheet_errors
end end
end end
def any_logs_already_exist?
row_parsers.any?(&:log_already_exists?)
end end
private
def any_logs_invalid? def any_logs_invalid?
row_parsers.any? { |row_parser| row_parser.log.invalid? } row_parsers.any? { |row_parser| row_parser.log.invalid? }
end end

23
app/services/bulk_upload/lettings/year2022/row_parser.rb

@ -438,6 +438,29 @@ class BulkUpload::Lettings::Year2022::RowParser
.exists?(duplicate_check_fields.index_with { |field| log.public_send(field) }) .exists?(duplicate_check_fields.index_with { |field| log.public_send(field) })
end end
def spreadsheet_duplicate_hash
attributes.slice(
"field_5", # location
"field_12", # age1
"field_20", # sex1
"field_35", # ecstat1
"field_84", # tcharge
"field_96", # startdate
"field_97", # startdate
"field_98", # startdate
"field_100", # propcode
"field_108", # postcode
"field_109", # postcode
"field_111", # owning org
)
end
def add_duplicate_found_in_spreadsheet_errors
spreadsheet_duplicate_hash.each_key do |field|
errors.add(field, :spreadsheet_dupe, category: :setup)
end
end
private private
def validate_declaration_acceptance def validate_declaration_acceptance

23
app/services/bulk_upload/lettings/year2023/row_parser.rb

@ -455,6 +455,29 @@ class BulkUpload::Lettings::Year2023::RowParser
.exists?(duplicate_check_fields.index_with { |field| log.public_send(field) }) .exists?(duplicate_check_fields.index_with { |field| log.public_send(field) })
end end
def spreadsheet_duplicate_hash
attributes.slice(
"field_1", # owning org
"field_7", # startdate
"field_8", # startdate
"field_9", # startdate
"field_14", # propcode
"field_17", # location
"field_23", # postcode
"field_24", # postcode
"field_46", # age1
"field_47", # sex1
"field_50", # ecstat1
"field_132", # tcharge
)
end
def add_duplicate_found_in_spreadsheet_errors
spreadsheet_duplicate_hash.each_key do |field|
errors.add(field, :spreadsheet_dupe, category: :setup)
end
end
private private
def validate_declaration_acceptance def validate_declaration_acceptance

1
app/services/bulk_upload/sales/log_creator.rb

@ -16,7 +16,6 @@ class BulkUpload::Sales::LogCreator
row_parser.log.bulk_upload = bulk_upload row_parser.log.bulk_upload = bulk_upload
row_parser.log.skip_update_status = true row_parser.log.skip_update_status = true
row_parser.log.status = "pending" row_parser.log.status = "pending"
row_parser.log.status_cache = row_parser.log.calculate_status row_parser.log.status_cache = row_parser.log.calculate_status
begin begin

19
app/services/bulk_upload/sales/validator.rb

@ -13,9 +13,11 @@ class BulkUpload::Sales::Validator
end end
def call def call
row_parsers.each_with_index do |row_parser, index| row_parsers.each(&:valid?)
row_parser.valid?
validate_duplicate_rows if FeatureToggle.bulk_upload_duplicate_log_check_enabled?
row_parsers.each_with_index do |row_parser, index|
row = index + row_offset + 1 row = index + row_offset + 1
row_parser.errors.each do |error| row_parser.errors.each do |error|
@ -67,6 +69,19 @@ class BulkUpload::Sales::Validator
private private
# n^2 algo
def validate_duplicate_rows
row_parsers.each do |rp|
dupe = row_parsers.reject { |r| r.object_id.equal?(rp.object_id) }.any? do |rp_counter|
rp.spreadsheet_duplicate_hash == rp_counter.spreadsheet_duplicate_hash
end
if dupe
rp.add_duplicate_found_in_spreadsheet_errors
end
end
end
def any_logs_invalid? def any_logs_invalid?
row_parsers.any? { |row_parser| row_parser.log.invalid? } row_parsers.any? { |row_parser| row_parser.log.invalid? }
end end

21
app/services/bulk_upload/sales/year2022/row_parser.rb

@ -411,6 +411,27 @@ class BulkUpload::Sales::Year2022::RowParser
field_1 field_1
end end
def spreadsheet_duplicate_hash
attributes.slice(
"field_1", # purcahser code
"field_2", # saledate
"field_3", # saledate
"field_4", # saledate
"field_7", # age1
"field_13", # sex1
"field_24", # ecstat1
"field_54", # postcode
"field_55", # postcode
"field_92", # owning org
)
end
def add_duplicate_found_in_spreadsheet_errors
spreadsheet_duplicate_hash.each_key do |field|
errors.add(field, :spreadsheet_dupe, category: :setup)
end
end
private private
def validate_data_protection_answered def validate_data_protection_answered

21
app/services/bulk_upload/sales/year2023/row_parser.rb

@ -533,6 +533,27 @@ class BulkUpload::Sales::Year2023::RowParser
field_6 field_6
end end
def spreadsheet_duplicate_hash
attributes.slice(
"field_1", # owning org
"field_3", # saledate
"field_4", # saledate
"field_5", # saledate
"field_6", # purchaser_code
"field_24", # postcode
"field_25", # postcode
"field_30", # age1
"field_31", # sex1
"field_35", # ecstat1
)
end
def add_duplicate_found_in_spreadsheet_errors
spreadsheet_duplicate_hash.each_key do |field|
errors.add(field, :spreadsheet_dupe, category: :setup)
end
end
private private
def validate_data_protection_answered def validate_data_protection_answered

11
config/locales/en.yml

@ -41,10 +41,17 @@ en:
activemodel: activemodel:
errors: errors:
models: models:
bulk_upload/sales/year2022/row_parser: bulk_upload/row_parser: &bulk_upload__row_parser__base
inclusion: Enter a valid value for %{question} inclusion: Enter a valid value for %{question}
spreadsheet_dupe: This is a duplicate of a log in your file
bulk_upload/lettings/year2022/row_parser:
<<: *bulk_upload__row_parser__base
bulk_upload/lettings/year2023/row_parser:
<<: *bulk_upload__row_parser__base
bulk_upload/sales/year2022/row_parser:
<<: *bulk_upload__row_parser__base
bulk_upload/sales/year2023/row_parser: bulk_upload/sales/year2023/row_parser:
inclusion: Enter a valid value for %{question} <<: *bulk_upload__row_parser__base
bulk_upload/lettings/validator: bulk_upload/lettings/validator:
attributes: attributes:
base: base:

1
spec/factories/sales_log.rb

@ -36,6 +36,7 @@ FactoryBot.define do
jointpur { 2 } jointpur { 2 }
end end
trait :completed do trait :completed do
purchid { rand(999_999_999).to_s }
ownershipsch { 2 } ownershipsch { 2 }
type { 8 } type { 8 }
saledate { Time.utc(2023, 2, 2, 10, 36, 49) } saledate { Time.utc(2023, 2, 2, 10, 36, 49) }

17
spec/services/bulk_upload/lettings/validator_spec.rb

@ -290,6 +290,23 @@ RSpec.describe BulkUpload::Lettings::Validator do
end end
end end
context "when duplicate rows present" do
let(:file) { Tempfile.new }
let(:path) { file.path }
let(:log) { build(:lettings_log, :completed) }
before do
file.write(BulkUpload::LettingsLogToCsv.new(log:, line_ending: "\r\n").default_2023_field_numbers_row)
file.write(BulkUpload::LettingsLogToCsv.new(log:, line_ending: "\r\n").to_2023_csv_row)
file.write(BulkUpload::LettingsLogToCsv.new(log:, line_ending: "\r\n").to_2023_csv_row)
file.close
end
it "creates errors" do
expect { validator.call }.to change(BulkUploadError.where(category: :setup, error: "This is a duplicate of a log in your file"), :count).by(24)
end
end
context "with unix line endings" do context "with unix line endings" do
let(:fixture_path) { file_fixture("2022_23_lettings_bulk_upload.csv") } let(:fixture_path) { file_fixture("2022_23_lettings_bulk_upload.csv") }
let(:file) { Tempfile.new } let(:file) { Tempfile.new }

12
spec/services/bulk_upload/lettings/year2022/row_parser_spec.rb

@ -1760,4 +1760,16 @@ RSpec.describe BulkUpload::Lettings::Year2022::RowParser do
end end
end end
end end
describe "#spreadsheet_duplicate_hash" do
it "returns a hash" do
expect(parser.spreadsheet_duplicate_hash).to be_a(Hash)
end
end
describe "#add_duplicate_found_in_spreadsheet_errors" do
it "adds errors" do
expect { parser.add_duplicate_found_in_spreadsheet_errors }.to change(parser.errors, :size)
end
end
end end

12
spec/services/bulk_upload/lettings/year2023/row_parser_spec.rb

@ -1830,4 +1830,16 @@ RSpec.describe BulkUpload::Lettings::Year2023::RowParser do
end end
end end
end end
describe "#spreadsheet_duplicate_hash" do
it "returns a hash" do
expect(parser.spreadsheet_duplicate_hash).to be_a(Hash)
end
end
describe "#add_duplicate_found_in_spreadsheet_errors" do
it "adds errors" do
expect { parser.add_duplicate_found_in_spreadsheet_errors }.to change(parser.errors, :size)
end
end
end end

16
spec/services/bulk_upload/sales/validator_spec.rb

@ -125,6 +125,22 @@ RSpec.describe BulkUpload::Sales::Validator do
expect { validator.call }.to change(BulkUploadError, :count) expect { validator.call }.to change(BulkUploadError, :count)
end end
end end
context "when duplicate rows present" do
let(:file) { Tempfile.new }
let(:path) { file.path }
let(:log) { build(:sales_log, :completed) }
before do
file.write(BulkUpload::SalesLogToCsv.new(log:, col_offset: 0).to_2022_csv_row)
file.write(BulkUpload::SalesLogToCsv.new(log:, col_offset: 0).to_2022_csv_row)
file.close
end
it "creates errors" do
expect { validator.call }.to change(BulkUploadError.where(category: :setup, error: "This is a duplicate of a log in your file"), :count).by(20)
end
end
end end
describe "#create_logs?" do describe "#create_logs?" do

12
spec/services/bulk_upload/sales/year2022/row_parser_spec.rb

@ -832,4 +832,16 @@ RSpec.describe BulkUpload::Sales::Year2022::RowParser do
end end
end end
end end
describe "#spreadsheet_duplicate_hash" do
it "returns a hash" do
expect(parser.spreadsheet_duplicate_hash).to be_a(Hash)
end
end
describe "#add_duplicate_found_in_spreadsheet_errors" do
it "adds errors" do
expect { parser.add_duplicate_found_in_spreadsheet_errors }.to change(parser.errors, :size)
end
end
end end

12
spec/services/bulk_upload/sales/year2023/row_parser_spec.rb

@ -1081,4 +1081,16 @@ RSpec.describe BulkUpload::Sales::Year2023::RowParser do
end end
end end
end end
describe "#spreadsheet_duplicate_hash" do
it "returns a hash" do
expect(parser.spreadsheet_duplicate_hash).to be_a(Hash)
end
end
describe "#add_duplicate_found_in_spreadsheet_errors" do
it "adds errors" do
expect { parser.add_duplicate_found_in_spreadsheet_errors }.to change(parser.errors, :size)
end
end
end end

2
spec/services/csv/sales_log_csv_service_spec.rb

@ -3,7 +3,7 @@ require "rails_helper"
RSpec.describe Csv::SalesLogCsvService do RSpec.describe Csv::SalesLogCsvService do
let(:form_handler_mock) { instance_double(FormHandler) } let(:form_handler_mock) { instance_double(FormHandler) }
let(:organisation) { create(:organisation) } let(:organisation) { create(:organisation) }
let!(:log) { create(:sales_log, :completed, owning_organisation: organisation) } let!(:log) { create(:sales_log, :completed, owning_organisation: organisation, purchid: nil) }
let(:service) { described_class.new(export_type: "labels") } let(:service) { described_class.new(export_type: "labels") }
let(:csv) { CSV.parse(service.prepare_csv(SalesLog.all)) } let(:csv) { CSV.parse(service.prepare_csv(SalesLog.all)) }

Loading…
Cancel
Save