
[AOPS-66] Add a Helper method and remove member from Set on raised error #2

Open: wants to merge 7 commits into base: master
1 change: 1 addition & 0 deletions .gitignore
@@ -20,3 +20,4 @@ tmp
*.o
*.a
mkmf.log
vendor/*
8 changes: 8 additions & 0 deletions .rubocop.yml
@@ -0,0 +1,8 @@
inherit_from: .rubocop_todo.yml

Style/StringLiterals:
EnforcedStyle: "double_quotes"

Metrics/BlockLength:
Exclude:
- "spec/**/*.rb"
Empty file added .rubocop_todo.yml
Empty file.
4 changes: 3 additions & 1 deletion Gemfile
@@ -1,4 +1,6 @@
source 'https://rubygems.org'
# frozen_string_literal: true

source "https://rubygems.org"

# Specify your gem's dependencies in redis_dedupe.gemspec
gemspec
5 changes: 3 additions & 2 deletions Rakefile
@@ -1,3 +1,4 @@
require "bundler/gem_tasks"
Dir.glob('tasks/**/*.rake').each(&method(:import))
# frozen_string_literal: true

require "bundler/gem_tasks"
Dir.glob("tasks/**/*.rake").each(&method(:import))
66 changes: 3 additions & 63 deletions lib/redis_dedupe.rb
@@ -1,64 +1,4 @@
require 'redis_dedupe/version'
# frozen_string_literal: true

module RedisDedupe
class<<self
attr_accessor :client
end

class Set
SEVEN_DAYS = 7 * 24 * 60 * 60

attr_reader :key, :expires_in

def initialize(redis, key, expires_in = SEVEN_DAYS)
@redis = redis
@key = key
@expires_in = expires_in
end

def check(member)
results = redis.pipelined do
redis.sadd(key, member)
redis.expire(key, expires_in)
end

if results[0]
yield
end
end

def finish
redis.del(key)
end

private

def redis
@redis
end
end

module Helpers
private

def dedupe
@dedupe ||= RedisDedupe::Set.new(RedisDedupe.client, [dedupe_namespace, dedupe_id].join(':'))
end

# Implement in class, should return an integer or string:
#
# Ex.
#
# def dedupe_id
# @announcement.id # => 42
# end
#
def dedupe_id
raise NotImplementedError
end

def dedupe_namespace
self.class.name
end
end
end
require "redis_dedupe/set"
require "redis_dedupe/helpers"
45 changes: 45 additions & 0 deletions lib/redis_dedupe/helpers.rb
@@ -0,0 +1,45 @@
# frozen_string_literal: true

# :nodoc:
module RedisDedupe
#
# Include `RedisDedupe::Helpers` to use +RedisDedupe::Set+
#
# class MyClass
# include RedisDedupe::Helpers
#
# private
#
# def dedupe_id
# "my_unique_set_key"
# end
# end
#
module Helpers
private

def dedupe
@dedupe ||= RedisDedupe::Set.new(RedisDedupe.client, key)
end

def key
[dedupe_namespace, dedupe_id].join(":")
end

# Implement in class, should return an integer or string:
#
# Ex.
#
# def dedupe_id
# @announcement.id # => 42
# end
#
def dedupe_id
raise NotImplementedError
end

def dedupe_namespace
self.class.name
end
end
end
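
As a quick illustration of how the Set key is composed from dedupe_namespace and dedupe_id in the Helpers module above (a minimal sketch: PaymentDueMailer is a hypothetical including class, and the methods are made public here purely for demonstration):

```ruby
# Hypothetical sketch of the key composition used by Helpers#key.
# In real usage these methods would be private and dedupe_id would be
# implemented by the class that includes RedisDedupe::Helpers.
class PaymentDueMailer
  def dedupe_namespace
    self.class.name
  end

  def dedupe_id
    42
  end

  def key
    [dedupe_namespace, dedupe_id].join(":")
  end
end

PaymentDueMailer.new.key # => "PaymentDueMailer:42"
```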
103 changes: 103 additions & 0 deletions lib/redis_dedupe/set.rb
@@ -0,0 +1,103 @@
# frozen_string_literal: true

# :nodoc:
module RedisDedupe
class << self
attr_accessor :client
end

[Review comment] #curious/nonblocking -- I like the idea of decomposing the RedisDedupe module into a Set and a Helpers file. Did you consider also leaving this attr_accessor for the client in an otherwise empty module RedisDedupe file? I found myself unsure of where client would be found and thought it might be good below the require statements in that file. Totally non-blocking!

# A mechanism to make sure that a block of code will only be called once for each specified identifier (or +member+)
# even if the calling process dies or restarts, as long as the datastore is +Redis+-backed.
#
# @example Keep the set around for 7 days, letting Redis handle its own memory cleanup after that time
# ```
# dedupe = RedisDedupe::Set.new($redis, "send_payment_due_emails")
# Account.all do |account|
# dedupe.check(account.id) do
# mail(to: account.billing_email, subject: "PAY US... NOW!!!")
# end
# end
# ```
#
# @example If you want to be able to repeat the process at any time immediately following this method
# ```
# dedupe = RedisDedupe::Set.new($redis, "send_welcome_emails")
# Account.all.pluck(:email) do |email|
# dedupe.check(email) { mail(to: email, subject: "Hello!") }
# end
# dedupe.finish
# ```
#
class Set
SEVEN_DAYS = 7 * 24 * 60 * 60

attr_reader :key, :expires_in

def initialize(redis, key, expires_in = SEVEN_DAYS)
@redis = redis
@key = key
@expires_in = expires_in
end

# Ensures that a block of code will only be run if the +member+ is not already contained in Redis.
# i.e. the code block has not already run for the specified +member+.
#
# Note that if the given block raises an error, the +member+ will not remain in the +Set+ and may be tried again.
#
# @param [String, Integer] member identifying value to make sure the given block only runs once
#
# @yield block to run for the specified +member+, which should only be run once for any particular member
#
# @return `nil` if the block was not run, otherwise the result of the yielded block
#
def check(member, &block)
raise ArgumentError, "passing a block is required" if block.nil?
return nil unless execute_block_for_member?(member)

[Review comment] #nonblocking -- I like the shift of this to a guard clause since it clarifies the purpose of the check method: execute the block unless the block is a duplicate. I always get a little nervous when a ? method has side effects (setting the key and updating its expiration). Still, I think setting a key and checking the result is a well-established way to use Redis to answer global application state questions like this.

I wonder if a positive version that also trivially removes the unnecessary nil would read better? Private methods that isolate the add and expire logic from the boolean might also clarify things.

Suggested change:
-return nil unless execute_block_for_member?(member)
+return if duplicate_request?(member)

And the supporting methods might look like this:

# @param member [String, Integer]  member identifying value to make sure the
#   given block only runs once
# @return [Boolean] when a member cannot be added to the set, it is considered a duplicate
def duplicate_request?(member)
  (added_to_set, _expiration_updated) = add_key_and_update_ttl(member)
  !added_to_set
end

# @param member [String, Integer]  member identifying value to make sure the
#   given block only runs once
# @return [Array<Boolean>] a list of pipeline results, the first element of which
#   will be true or false depending on whether or not the add operation was
#   successful. If false, the requested member should be considered a duplicate.
def add_key_and_update_ttl(member)
  redis.pipelined do
    redis.sadd(key, member)
    redis.expire(key, expires_in)
  end
end

Totally optional and maybe not even an improvement. I personally needed to think pretty hard about why "unless execute_block_for_member?(member)" should cause the block not to run, as well as look up why results[0] was a boolean indicating the sadd succeeded or failed. Might just be my rusty Redis brain.


begin
block.call
rescue StandardError => e
redis.srem(key, member)

[Review comment, Member]

So this is the change I'm still wrapping my head around. I think the behavior looks right compared to what we have (in fact, what we have I'd say is probably a bug).

I think the biggest trail my brain is going down is, could this have a negative impact on any existing app flows? I'm thinking for instance, if we run a large execution of a collection of records having to do with mailing, and there's a failure partway through the batch that is repeatable, that execution job would never be able to finish the collection. Currently, that becomes a "skip" and the collection can finish (this has its own problems, what if we are skipping something really important). As a side note, another mechanism that comes to mind is some type of dead-letter queue.

I'm thinking one thing worth it would be to run the change by some teams with big collection/batch processes that rely on dedupe. Manage and Messaging teams come to mind. I'm interested in getting their thoughts on the behavioral change as it could impact their domains. /cc @cjbuchmann @thunderd0m3 @aburka @cforcey

[Review comment]

This is a very interesting proposed change. I agree that what we have is essentially a try_once_and_skip_on_exception sort of functionality from this class, which might come as a surprise to some consumers of the gem. Your version feels closer to execute_successfully_once functionality that allows transient errors sending an email to be recovered from by clearing the key from the set.

I am guessing your nervousness -- and mine -- comes from the wide-open nature of the block being wrapped by this helper. If what is being wrapped is a pipeline with several steps, each with side effects, then an exception on a later step might trigger a job retry, duplicating side effects up to that point. This feels a little far-fetched if what is being wrapped is a single invocation of a mailer, but some of our usages look a bit more complicated.

The API for this class is already a little odd -- RedisDedupe::Set#check does not roll off the tongue as a well-understood guarantee like run_only_once or run_successfully_only_once might. It might be total overkill, but you could offer an additional method in the current naming scheme, like check_finished, that wraps the check method in your rescue block.

That would allow consumers of this library to decide whether it is more important to never run this twice -- exceptionally or successfully -- or to tolerate a few retries because it is important that at least one (but perhaps more) succeed. The downside of that, of course, is that the new, better behavior does not magically get applied in most of the cases where you would want it to. You could also make your method check and have it wrap check_if_duplicate_or_try_once or some such method. If someone really cared about the old behavior they could use that method (horribly named).

My last thought is that one RedisDedupe is unlikely to handle all the different use cases for run_once functionality -- marketing messages already use email_deliveries to try to sort out what was sent in a first attempt and what should be retried. Our rewrites of the transactional email system will most likely involve a more nuanced record like email_delivery for those messages that tracks the state of a delivery attempt and uses that state to prevent the dreaded multiple-emails problem. Your PR inspired this small problem statement along those lines -- feedback is welcome! https://kajabi.atlassian.net/wiki/spaces/MAR/pages/1234141598/Duplicate+Email+Prevention+in+Transactional+Email
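
To make the tradeoff under discussion concrete, here is a minimal sketch of the new rescue-and-retry semantics using an in-memory stand-in (FakeSet and the member name are invented for illustration; no Redis is required):

```ruby
# FakeSet mimics RedisDedupe::Set#check with the PR's new behavior:
# a member whose block raises is removed again, so a later retry
# re-runs the block instead of silently skipping it.
class FakeSet
  def initialize
    @members = {}
  end

  def check(member)
    return nil if @members.key?(member) # duplicate: skip the block
    @members[member] = true
    begin
      yield
    rescue StandardError
      @members.delete(member) # new behavior: allow a later retry
      raise
    end
  end
end

set = FakeSet.new
attempts = 0
begin
  set.check("acct-1") { attempts += 1; raise "transient SMTP failure" }
rescue RuntimeError
  # first attempt failed; the member was removed from the set
end
set.check("acct-1") { attempts += 1 } # retry: block runs again
set.check("acct-1") { attempts += 1 } # now a duplicate: block skipped
attempts # => 2
```

Under the old behavior the rescue clause would be absent, the failed member would stay in the set, and attempts would end at 1.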

raise e
end
end

def finish
redis.del(key)
end

# Retrieves the member in the set with the largest value.
#
# This will work on Strings and Integers, but is really meant for Integers.
# If used with Strings, make sure it's really doing what you want and expect.
#
# @example with Integers
# redis.smembers("foo") => [1, 2, 3, 4, 5]
# max_member => 5
#
# @example with String
# redis.smembers("foo") => ["abc", "xyz", "lmn"]
# max_member => "xyz"
#
# @see Array#max
#
# @return [Integer, String] the member in the set with the largest value
#
def max_member
redis.smembers(key).max
end

private

attr_reader :redis

def execute_block_for_member?(member)
results = redis.pipelined do
redis.sadd(key, member)
redis.expire(key, expires_in)
end

results[0] # `results` will be `[true]` or `[false]`
end
end
end
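
As a side note on max_member above: Redis clients such as redis-rb return set members as Strings, and Array#max on Strings compares lexicographically, which is the caveat the doc comment hints at. A plain-Ruby sketch (no Redis needed):

```ruby
# Why max_member is "really meant for Integer" only with care:
# String comparison is lexicographic, so "9" sorts above "10".
members = %w[9 10 2]     # what smembers might return for {2, 9, 10}
members.max              # => "9"  (lexicographic String comparison)
members.map(&:to_i).max  # => 10   (numeric comparison after conversion)
```

If callers need a numeric resume point, mapping with to_i before taking the max avoids the surprise.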
5 changes: 4 additions & 1 deletion lib/redis_dedupe/version.rb
@@ -1,3 +1,6 @@
# frozen_string_literal: true

# :nodoc:
module RedisDedupe
VERSION = "0.0.3"
VERSION = "0.0.4"

[Review comment, Member]

This is one thing I was wondering about myself. Since the behavior is to re-run previously failed blocks, which could cause the loop to switch from "finishable" to "unfinishable" if the execution stoppage is repeatable, is it a major version bump perhaps? Seems like a potentially breaking change, but also, the behavior now does seem like a bug as well. Thoughts?

[Review comment]

Yeah, I am not a semantic versioning expert, but I think this is a good question. The interface is the same, which feels like a minor version change. The modification of the exception handling feels borderline major, with the new potential for duplicate execution of some block segments depending on when an exception occurs in a block with side effects. You could separate the clean refactor as a new minor version and then bump us to 0.1.0 or something for the one change to rescuing, if you wanted to make it more clear.

end
42 changes: 26 additions & 16 deletions redis_dedupe.gemspec
@@ -1,24 +1,34 @@
# coding: utf-8
lib = File.expand_path('../lib', __FILE__)
# frozen_string_literal: true

lib = File.expand_path("lib", __dir__)
$LOAD_PATH.unshift(lib) unless $LOAD_PATH.include?(lib)
require 'redis_dedupe/version'
require "redis_dedupe/version"

Gem::Specification.new do |spec|
spec.name = "redis_dedupe"
spec.version = RedisDedupe::VERSION
spec.authors = ["Andy Huynh"]
spec.email = ["andy4thehuynh@gmail.com"]
spec.summary = %q{ A weak deduper to make things like bulk email run safer. }
spec.description = %q{ This is a weak deduper to make things like bulk email run safer. It is not a lock safe for financial/security needs because it uses a weak redis locking pattern that can have race conditions. However, imagine a bulk email job that loops over 100 users, and enqueues a background email for each user. If the job fails at iteration 50, a retry would enqueue all the users again and many will receive dupes. This would continue multiple times as the parent job continued to rerun. By marking that a subjob has been enqueued, we can let that isolated job handle its own failures, and the batch enqueue job can run multiple times without re-enqueueing the same subjobs. }
spec.homepage = ""
spec.license = "MIT"

spec.files = `git ls-files -z`.split("\x0")
spec.executables = spec.files.grep(%r{^bin/}) { |f| File.basename(f) }
spec.require_paths = ["lib"]
spec.name = "redis_dedupe"
spec.version = RedisDedupe::VERSION
spec.required_ruby_version = ">= 2.6.0"
spec.authors = ["Andy Huynh"]
spec.email = ["andy4thehuynh@gmail.com"]
spec.summary = "A weak deduper to make things like bulk email run safer."
spec.homepage = ""
spec.license = "MIT"
spec.files = Dir["lib/**/*.rb"] + ["lib/redis_dedupe.rb"]
spec.executables = spec.files.grep(%r{^bin/}) { |f| File.basename(f) }
spec.require_paths = ["lib"]
spec.description = <<~EO_DESC
This is a weak deduper to make things like bulk email run safer. It is not a lock safe for financial/security needs
because it uses a weak redis locking pattern that can have race conditions. However, imagine a bulk email job that
loops over 100 users, and enqueues a background email for each user. If the job fails at iteration 50, a retry
would enqueue all the users again and many will receive dupes. This would continue multiple times as the parent
job continued to rerun. By marking that a subjob has been enqueued, we can let that isolated job handle its own
failures, and the batch enqueue job can run multiple times without re-enqueueing the same subjobs.
EO_DESC

spec.add_development_dependency "bundler", "~> 1.6"
spec.add_development_dependency "mock_redis"
spec.add_development_dependency "rake"
spec.add_development_dependency "rspec"
spec.add_development_dependency "mock_redis"
spec.add_development_dependency "rubocop"
spec.add_development_dependency "timecop"
end
45 changes: 45 additions & 0 deletions spec/redis_dedupe/helpers_spec.rb
@@ -0,0 +1,45 @@
# frozen_string_literal: true

require "mock_redis"
require "spec_helper"

require "redis_dedupe/helpers"

RSpec.describe RedisDedupe::Helpers do
let(:redis) { MockRedis.new }
let(:instance) { RedisDedupeSpecStubbedClass.new }

before do
allow(RedisDedupe).to receive(:client).and_return(redis)
end

describe "#dedupe" do
subject { instance.test_call }

it { expect(subject).to eq(2) }

it "uses the correct redis key" do
subject
expect(redis.smembers("RedisDedupeSpecStubbedClass:just_a_test")).to match_array(%w[5 7])
end
end
end

# :nodoc:
class RedisDedupeSpecStubbedClass
include RedisDedupe::Helpers

def test_call
counter = 0

dedupe.check(5) { counter += 1 }
dedupe.check(5) { counter += 1 }
dedupe.check(7) { counter += 1 }

counter
end

def dedupe_id
"just_a_test"
end
end