cjcolvar/gist:1ca9326120e99ab1bddde0f66c4877fc

## gistfile1.txt
module ActiveFedora
  module Indexing
    # Finds all descendent URIs of a given repo URI (usually the base URI).
    #
    # This is a slow and non-performant thing to do, we need to fetch every single
    # object from the repo.
    #
    # The AvalonDescendantFetcher only collects the URIs of objects whose hasModel value
    # is one of the "priority" models, grouped by model name; objects with any other
    # model are visited but are not part of the result. This feature is used in some
    # hydra apps that need to index 'permissions' objects before other objects to have
    # the solr indexing work right. And so by default, the prioritized class names are
    # the ones from Hydra::AccessControls, but you can alter the prioritized model name
    # list, or set it to the empty array.
    #
    #     AvalonDescendantFetcher.new(ActiveFedora.fedora.base_uri).descendant_and_self_uris
    #     #=> array of the self and descendant URIs whose hasModel is one of the
    #         "prioritized" (by default Hydra::AccessControls permissions) models.
    #
    # Change the default prioritized hasModel names:
    #
    #     ActiveFedora::Indexing::AvalonDescendantFetcher.default_priority_models = []
    class AvalonDescendantFetcher
      # Predicate whose literal objects name the model(s) of a resource.
      HAS_MODEL_PREDICATE = ActiveFedora::RDF::Fcrepo::Model.hasModel

      # Model names used when the caller does not pass +priority_models:+.
      class_attribute :default_priority_models, instance_accessor: false
      self.default_priority_models = %w(Hydra::AccessControl Hydra::AccessControl::Permissions).freeze

      attr_reader :uri, :priority_models

      # @param uri URI of the resource the walk starts from
      # @param priority_models [Array<String>] hasModel values whose URIs are collected
      # @param exclude_self [Boolean] when true, +uri+ itself is never added to the result
      #   (child fetchers are always created with the default, false)
      # @param recursive [Boolean] when false, the resources contained by +uri+ are not visited
      def initialize(uri,
                     priority_models: self.class.default_priority_models, exclude_self: false, recursive: true)
        @uri = uri
        @priority_models = priority_models
        @exclude_self = exclude_self
        @recursive = recursive
      end

      # @return [Array] every collected URI, flattened across all model names
      def descendant_and_self_uris
        descendant_and_self_uris_partitioned.values.flatten
      end

      # Walks +uri+ and the resources it contains, collecting the URIs of those whose
      # hasModel value is one of +priority_models+.
      #
      # @return [Hash] model name => array of URIs having that model. Resources whose
      #   model is not in +priority_models+ do not appear in the hash at all.
      def descendant_and_self_uris_partitioned
        # GET could be slow if it's a big resource, we're using HEAD to avoid this problem,
        # but this causes more requests to Fedora.
        return partitioned_uris unless rdf_resource.head.rdf_source?

        add_self_to_partitioned_uris unless @exclude_self
        return partitioned_uris unless @recursive

        # The pattern is passed as an explicit Hash (not keyword arguments) so the call
        # binds to the positional +pattern+ parameter of RDF::Queryable#query.
        child_uris = rdf_graph.query({ predicate: ::RDF::Vocab::LDP.contains }).map { |statement| statement.object.to_s }

        # Children only descend further when this resource is a pairtree node or the
        # repository root. The answer is the same for every child, so compute it once.
        children_recurse = pair_tree_object? || is_root_object?

        child_uris.each do |child_uri|
          child = self.class.new(child_uri, priority_models: priority_models, recursive: children_recurse)
          child.descendant_and_self_uris_partitioned.each do |model, uris|
            (partitioned_uris[model] ||= []).concat(uris)
          end
        end
        partitioned_uris
      end

      protected

        # LDP resource for +uri+, memoized so the HEAD check and the graph fetch share it.
        def rdf_resource
          @rdf_resource ||= Ldp::Resource::RdfSource.new(ActiveFedora.fedora.connection, uri)
        end

        # Graph of +rdf_resource+, memoized.
        def rdf_graph
          @rdf_graph ||= rdf_resource.graph
        end

        # Accumulator for the result: model name => array of URIs.
        def partitioned_uris
          @partitioned_uris ||= {}
        end

        # hasModel values of this resource as strings; non-literal objects are ignored.
        def rdf_graph_models
          rdf_graph.query({ predicate: HAS_MODEL_PREDICATE }).map(&:object).select(&:literal?).map(&:to_s)
        end

        # rdf:type values of this resource as strings.
        def rdf_types
          rdf_graph.query({ predicate: ::RDF.type }).map { |statement| statement.object.to_s }
        end

        def pair_tree_object?
          rdf_types.include? "http://fedora.info/definitions/v4/repository#Pairtree"
        end

        def is_root_object?
          rdf_resource.subject == ActiveFedora.fedora.base_uri
        end

        # Records this resource's subject under each of its models that is a priority model.
        def add_self_to_partitioned_uris
          rdf_graph_models.each do |model|
            next unless priority_models.include?(model)
            (partitioned_uris[model] ||= []) << rdf_resource.subject
          end
        end
    end
  end
end
	module ActiveFedora
	  module Indexing
	    # Finds descendant URIs of a given repo URI (usually the base URI).
	    #
	    # This is a slow and non-performant thing to do, we need to fetch every single
	    # object from the repo.
	    #
	    # The AvalonDescendantFetcher only collects the URIs of objects whose hasModel value
	    # is one of the "priority" models, grouped by model name; objects with any other
	    # model are visited but are not part of the result. This feature is used in some
	    # hydra apps that need to index 'permissions' objects before other objects to have
	    # the solr indexing work right. And so by default, the prioritized class names are
	    # the ones from Hydra::AccessControls, but you can alter the prioritized model name
	    # list, or set it to the empty array.
	    #
	    #     AvalonDescendantFetcher.new(ActiveFedora.fedora.base_uri).descendant_and_self_uris
	    #     #=> array of the self and descendant URIs whose hasModel is one of the
	    #         "prioritized" (by default Hydra::AccessControls permissions) models.
	    #
	    # Change the default prioritized hasModel names:
	    #
	    #     ActiveFedora::Indexing::AvalonDescendantFetcher.default_priority_models = []
	    class AvalonDescendantFetcher
	      # Predicate whose literal objects name the model(s) of a resource.
	      HAS_MODEL_PREDICATE = ActiveFedora::RDF::Fcrepo::Model.hasModel

	      # Model names used when the caller does not pass +priority_models:+.
	      class_attribute :default_priority_models, instance_accessor: false
	      self.default_priority_models = %w(Hydra::AccessControl Hydra::AccessControl::Permissions).freeze

	      attr_reader :uri, :priority_models

	      # @param uri URI of the resource the walk starts from
	      # @param priority_models [Array<String>] hasModel values whose URIs are collected
	      # @param exclude_self [Boolean] when true, +uri+ itself is never added to the result
	      #   (child fetchers are always created with the default, false)
	      # @param recursive [Boolean] when false, the resources contained by +uri+ are not visited
	      def initialize(uri,
	                     priority_models: self.class.default_priority_models, exclude_self: false, recursive: true)
	        @uri = uri
	        @priority_models = priority_models
	        @exclude_self = exclude_self
	        @recursive = recursive
	      end

	      # @return [Array] every collected URI, flattened across all model names
	      def descendant_and_self_uris
	        descendant_and_self_uris_partitioned.values.flatten
	      end

	      # Walks +uri+ and the resources it contains, collecting the URIs of those whose
	      # hasModel value is one of +priority_models+.
	      #
	      # @return [Hash] model name => array of URIs having that model. Resources whose
	      #   model is not in +priority_models+ do not appear in the hash at all.
	      def descendant_and_self_uris_partitioned
	        # GET could be slow if it's a big resource, we're using HEAD to avoid this problem,
	        # but this causes more requests to Fedora.
	        return partitioned_uris unless rdf_resource.head.rdf_source?

	        add_self_to_partitioned_uris unless @exclude_self
	        return partitioned_uris unless @recursive

	        # The pattern is passed as an explicit Hash (not keyword arguments) so the call
	        # binds to the positional +pattern+ parameter of RDF::Queryable#query.
	        child_uris = rdf_graph.query({ predicate: ::RDF::Vocab::LDP.contains }).map { |statement| statement.object.to_s }

	        # Children only descend further when this resource is a pairtree node or the
	        # repository root. The answer is the same for every child, so compute it once.
	        children_recurse = pair_tree_object? || is_root_object?

	        child_uris.each do |child_uri|
	          child = self.class.new(child_uri, priority_models: priority_models, recursive: children_recurse)
	          child.descendant_and_self_uris_partitioned.each do |model, uris|
	            (partitioned_uris[model] ||= []).concat(uris)
	          end
	        end
	        partitioned_uris
	      end

	      protected

	        # LDP resource for +uri+, memoized so the HEAD check and the graph fetch share it.
	        def rdf_resource
	          @rdf_resource ||= Ldp::Resource::RdfSource.new(ActiveFedora.fedora.connection, uri)
	        end

	        # Graph of +rdf_resource+, memoized.
	        def rdf_graph
	          @rdf_graph ||= rdf_resource.graph
	        end

	        # Accumulator for the result: model name => array of URIs.
	        def partitioned_uris
	          @partitioned_uris ||= {}
	        end

	        # hasModel values of this resource as strings; non-literal objects are ignored.
	        def rdf_graph_models
	          rdf_graph.query({ predicate: HAS_MODEL_PREDICATE }).map(&:object).select(&:literal?).map(&:to_s)
	        end

	        # rdf:type values of this resource as strings.
	        def rdf_types
	          rdf_graph.query({ predicate: ::RDF.type }).map { |statement| statement.object.to_s }
	        end

	        def pair_tree_object?
	          rdf_types.include? "http://fedora.info/definitions/v4/repository#Pairtree"
	        end

	        def is_root_object?
	          rdf_resource.subject == ActiveFedora.fedora.base_uri
	        end

	        # Records this resource's subject under each of its models that is a priority model.
	        def add_self_to_partitioned_uris
	          rdf_graph_models.each do |model|
	            next unless priority_models.include?(model)
	            (partitioned_uris[model] ||= []) << rdf_resource.subject
	          end
	        end
	    end
	  end
	end