# canvas-lms/lib/user_merge.rb

# 476 lines
# 21 KiB
# Ruby

#
# Copyright (C) 2013 - present Instructure, Inc.
#
# This file is part of Canvas.
#
# Canvas is free software: you can redistribute it and/or modify it under
# the terms of the GNU Affero General Public License as published by the Free
# Software Foundation, version 3 of the License.
#
# Canvas is distributed in the hope that it will be useful, but WITHOUT ANY
# WARRANTY; without even the implied warranty of MERCHANTABILITY or FITNESS FOR
# A PARTICULAR PURPOSE. See the GNU Affero General Public License for more
# details.
#
# You should have received a copy of the GNU Affero General Public License along
# with this program. If not, see <http://www.gnu.org/licenses/>.
class UserMerge
# Fluent entry point for a merge: wraps +user+ as the account whose data will
# be moved, so a caller can chain straight into #into.
#
# @param user the user to merge away; becomes the new object's +from_user+
# @return a new merger built around +user+
def self.from(user)
  new(user)
end
# The user being merged away; every helper in this class reads it.
attr_reader :from_user

# @param from_user the user whose records #into transfers to another user
def initialize(from_user)
  @from_user = from_user
end
# Merges +from_user+ into +target_user+, then destroys +from_user+.
#
# The work happens in this order:
#   1. a UserMergeData row is created on the target's shard; most records
#      touched below are passed to it via add_more_data
#   2. the avatar is copied when the target has none, and the target is
#      associated with every shard the source is associated with
#   3. communication channels, conflicting module progressions and enrollments
#      are reconciled by the dedicated helpers
#   4. on each shard associated with the source: pseudonyms, submissions, quiz
#      submissions, conversations, discussions, account users, attachments and
#      a list of simple user_id/author_id tables are re-pointed at the target
#   5. the source is reloaded and destroyed, and the target is touched
#
# Failures while migrating submissions, discussions or the simple tables are
# logged and skipped; they do not abort the merge.
#
# @param target_user the user that receives the data; a nil target, or a
#   target equal to +from_user+, makes the call a no-op
# @return the result of +from_user.destroy+, or nil when the call was a no-op
def into(target_user)
  return unless target_user
  return if target_user == from_user

  user_merge_data = target_user.shard.activate do
    UserMergeData.create!(user: target_user, from_user: from_user)
  end

  # Only adopt the source's avatar when the target has none of its own.
  if target_user.avatar_state == :none && from_user.avatar_state != :none
    [:avatar_image_source, :avatar_image_url, :avatar_image_updated_at, :avatar_state].each do |attr|
      target_user[attr] = from_user[attr]
    end
  end
  target_user.save if target_user.changed?

  [:strong, :weak, :shadow].each do |strength|
    from_user.associated_shards(strength).each do |shard|
      target_user.associate_with_shard(shard, strength)
    end
  end

  handle_communication_channels(target_user, user_merge_data)
  destroy_conflicting_module_progressions(@from_user, target_user)
  move_enrollments(target_user, user_merge_data)

  Shard.with_each_shard(from_user.associated_shards + from_user.associated_shards(:weak) + from_user.associated_shards(:shadow)) do
    # Append the source's pseudonyms after the target's existing ones.
    max_position = Pseudonym.where(user_id: target_user).order(:position).last.try(:position) || 0
    pseudonyms_to_move = Pseudonym.where(user_id: from_user)
    user_merge_data.add_more_data(pseudonyms_to_move)
    pseudonyms_to_move.update_all(["user_id=?, position=position+?", target_user, max_position])

    target_user.communication_channels.email.unretired.each do |cc|
      Rails.cache.delete([cc.path, 'invited_enrollments2'].cache_key)
    end

    [
      [:assignment_id, :submissions],
      [:quiz_id, :'quizzes/quiz_submissions']
    ].each do |unique_id, table|
      begin
        # Submissions are a special case since there's a unique index
        # on the table, and if both the old user and the new user
        # have a submission for the same assignment there will be
        # a conflict.
        model = table.to_s.classify.constantize
        already_scope = model.where(:user_id => target_user)
        scope = model.where(:user_id => from_user)
        if model.name == "Submission"
          # we prefer submissions that have grades then submissions that have
          # a submission... that sort of makes sense.
          # we swap empty objects in cases of collision so that we don't
          # end up causing a unique index violation for a given assignment for
          # the either user, but also so we don't destroy submissions in case
          # of a user split.
          to_move_ids = scope.graded.select(unique_id).where.not(unique_id => already_scope.graded.select(unique_id)).pluck(:id)
          to_move_ids += scope.having_submission.select(unique_id).where.not(unique_id => already_scope.having_submission.select(unique_id), id: to_move_ids).pluck(:id)
          to_move = scope.where(id: to_move_ids).to_a
          move_back = already_scope.where(unique_id => to_move.map(&unique_id)).to_a
          user_merge_data.add_more_data(to_move)
          user_merge_data.add_more_data(move_back)
          model.transaction do
            # there is a unique index on assignment_id and user_id. Unique
            # indexes are checked after every row during an update statement
            # to get around this and to allow us to swap we are setting the
            # user_id to the negative user_id and then the user_id, after the
            # conflicting rows have been updated.
            model.connection.execute("SET CONSTRAINTS #{model.connection.quote_table_name('fk_rails_8d85741475')} DEFERRED")
            model.where(id: move_back).update_all(user_id: -from_user.id)
            model.where(id: to_move_ids).update_all(user_id: target_user.id)
            model.where(id: move_back).update_all(user_id: from_user.id)
            update_versions(from_user, target_user, model.where(id: to_move), table, :user_id)
            update_versions(target_user, from_user, model.where(id: move_back), table, :user_id)
          end
        elsif model.name == "Quizzes::QuizSubmission"
          subscope = already_scope.to_a
          # Quiz submissions follow the user their linked submission now
          # belongs to (submissions were handled in the previous iteration).
          to_move = model.where(user_id: from_user).joins(:submission).where(submissions: {user_id: target_user}).to_a
          move_back = model.where(user_id: target_user).joins(:submission).where(submissions: {user_id: from_user}).to_a
          # Everything else moves unless the target already has a quiz
          # submission for that quiz. The hash form of where.not is used
          # because binding an empty array into "NOT IN (?)" renders
          # "NOT IN (NULL)", which matches no rows at all.
          excluded_ids = [subscope.map(&unique_id), move_back.map(&unique_id)].flatten
          to_move += scope.where.not(unique_id => excluded_ids).to_a
          move_back += already_scope.where(unique_id => to_move.map(&unique_id)).to_a
          user_merge_data.add_more_data(to_move)
          user_merge_data.add_more_data(move_back)
          model.transaction do
            # Same negative-id swap as for submissions above.
            model.connection.execute("SET CONSTRAINTS #{model.connection.quote_table_name('fk_rails_04850db4b4')} DEFERRED")
            model.where(id: move_back).update_all(user_id: -from_user.id)
            model.where(id: to_move).update_all(user_id: target_user.id)
            model.where(id: move_back).update_all(user_id: from_user.id)
            update_versions(from_user, target_user, model.where(id: to_move), table, :user_id)
            update_versions(target_user, from_user, model.where(id: move_back), table, :user_id)
          end
        end
      rescue => e
        # Best effort: log and carry on with the rest of the merge.
        Rails.logger.error "migrating #{table} column user_id failed: #{e}"
      end
    end

    from_user.all_conversations.find_each { |c| c.move_to_user(target_user) }

    # all topics changing ownership or with entries changing ownership need to be
    # flagged as updated so the materialized views update
    begin
      entries = DiscussionEntry.where(user_id: from_user)
      DiscussionTopic.where(id: entries.select(['discussion_topic_id'])).touch_all
      entries.update_all(user_id: target_user.id)
      DiscussionTopic.where(user_id: from_user).update_all(user_id: target_user.id, updated_at: Time.now.utc)
    rescue => e
      Rails.logger.error "migrating discussions failed: #{e}"
    end

    account_users = AccountUser.where(user_id: from_user)
    user_merge_data.add_more_data(account_users)
    account_users.update_all(user_id: target_user.id)

    # Attachments are recorded here; the move itself is queued via send_later.
    attachments = Attachment.where(user_id: from_user)
    user_merge_data.add_more_data(attachments)
    Attachment.send_later(:migrate_attachments, from_user, target_user)

    # table name => column that references the user
    updates = {}
    ['access_tokens', 'asset_user_accesses',
     'calendar_events', 'collaborations',
     'context_module_progressions',
     'group_memberships', 'page_comments',
     'rubric_assessments',
     'user_services', 'web_conferences',
     'web_conference_participants', 'wiki_pages'].each do |key|
      updates[key] = "user_id"
    end
    updates['submission_comments'] = 'author_id'
    updates['conversation_messages'] = 'author_id'
    updates = updates.to_a
    # tables whose stored versions also embed the user id
    version_updates = ['rubric_assessments', 'wiki_pages']
    updates.each do |table, column|
      begin
        klass = table.classify.constantize
        if klass.new.respond_to?("#{column}=".to_sym)
          scope = klass.where(column => from_user)
          klass.transaction do
            if version_updates.include?(table)
              update_versions(from_user, target_user, scope, table, column)
            end
            scope.update_all(column => target_user.id)
          end
        end
      rescue => e
        Rails.logger.error "migrating #{table} column #{column} failed: #{e}"
      end
    end

    # Records that use the user as their polymorphic context.
    context_updates = ['calendar_events']
    context_updates.each do |table|
      klass = table.classify.constantize
      klass.where(context_id: from_user, context_type: 'User').
        update_all(context_id: target_user.id, context_code: target_user.asset_string)
    end

    # Observation links are only moved while on the target user's own shard.
    if Shard.current == target_user.shard
      move_observees(target_user, user_merge_data)
    end

    Enrollment.send_later(:recompute_due_dates_and_scores, target_user.id)
    target_user.update_account_associations
  end

  from_user.reload
  target_user.touch
  from_user.destroy
end
# Walks every communication channel of from_user and reconciles it with the
# target's channels, then hands the collected results to #finish_ccs.
#
# For each source channel:
#   * if the target has a channel with the same path and type, the clash is
#     settled by #handle_conflicting_ccs and any channel it returns is queued
#     for retirement
#   * otherwise, when the two users are on different shards, the channel is
#     cloned onto the target and the clone is recorded in +user_merge_data+
#     with workflow_state 'non_existent'
#
# @param target_user the user receiving the channels
# @param user_merge_data merge record that collects what was touched
# @return whatever #finish_ccs returns
def handle_communication_channels(target_user, user_merge_data)
  position_offset = target_user.communication_channels.last.try(:position) || 0
  # ids already on the target, so a freshly cloned channel can be told apart
  seen_target_cc_ids = target_user.communication_channels.pluck(:id)
  retire_ids = []

  from_user.communication_channels.each do |source_cc|
    # have to find conflicting CCs, and make sure we don't have conflicts
    conflict = detect_conflicting_cc(source_cc, target_user)
    if conflict
      retiree = handle_conflicting_ccs(source_cc, conflict, target_user, position_offset)
      retire_ids << retiree.id if retiree
    elsif from_user.shard != target_user.shard
      User.clone_communication_channel(source_cc, target_user, position_offset)
      cloned = target_user.communication_channels.where.not(id: seen_target_cc_ids).take
      seen_target_cc_ids << cloned.id
      user_merge_data.add_more_data([cloned], user: target_user, workflow_state: 'non_existent')
    end
  end

  finish_ccs(position_offset, target_user, retire_ids, user_merge_data)
end
# Finds the first of target_user's communication channels that clashes with
# +source_cc+: same path (compared after downcasing both) and same path_type.
#
# @param source_cc the channel being merged in
# @param target_user the user whose channels are searched
# @return the first clashing channel, or nil when there is none
def detect_conflicting_cc(source_cc, target_user)
  target_user.communication_channels.each do |candidate|
    same_path = candidate.path.downcase == source_cc.path.downcase
    return candidate if same_path && candidate.path_type == source_cc.path_type
  end
  nil
end
# Final step of the communication-channel merge.
#
# Different shards: everything is delegated to #handle_cross_shard_cc.
# Same shard: the channels in +to_retire_ids+ that are not already retired are
# recorded and retired, then every remaining non-retired channel of from_user
# is recorded and re-pointed at +target_user+, with its position shifted by
# +max_position+.
#
# @param max_position offset added to the position of each moved channel
# @param target_user the user receiving the channels
# @param to_retire_ids ids of source channels that lost a conflict
# @param user_merge_data merge record that collects what was touched
def finish_ccs(max_position, target_user, to_retire_ids, user_merge_data)
  return handle_cross_shard_cc(target_user, user_merge_data) if from_user.shard != target_user.shard

  from_user.shard.activate do
    retiring = CommunicationChannel.where(id: to_retire_ids).where.not(workflow_state: 'retired')
    unless to_retire_ids.empty?
      user_merge_data.add_more_data(retiring)
      retiring.update_all(workflow_state: 'retired')
    end
  end

  remaining = from_user.communication_channels.where.not(workflow_state: 'retired')
  remaining = remaining.where.not(id: to_retire_ids) unless to_retire_ids.empty?
  return if remaining.empty?

  user_merge_data.add_more_data(remaining)
  remaining.update_all(["user_id=?, position=position+?", target_user, max_position])
end
# Cross-shard variant of the channel/service hand-over.
#
# Every non-retired communication channel of from_user is recorded and
# retired. Each of from_user's user services is cloned, re-homed on the
# target's shard and user, saved, and recorded with workflow_state
# 'non_existent'; the originals are then recorded and deleted.
#
# @param target_user the user receiving the services
# @param user_merge_data merge record that collects what was touched
def handle_cross_shard_cc(target_user, user_merge_data)
  live_ccs = from_user.communication_channels.where.not(workflow_state: 'retired')
  unless live_ccs.empty?
    user_merge_data.add_more_data(live_ccs)
    live_ccs.update_all(workflow_state: 'retired')
  end

  from_user.user_services.each do |service|
    copy = service.clone
    copy.shard = target_user.shard
    copy.user = target_user
    copy.save!
    user_merge_data.add_more_data([copy], user: target_user, workflow_state: 'non_existent')
  end

  # record the originals before removing them from the source user
  user_merge_data.add_more_data(from_user.user_services)
  from_user.user_services.delete_all
end
# Settles a clash between a channel of from_user (+source_cc+) and a channel
# of the target user (+target_cc+) that share path and type. The "most" active
# channel is kept, and the target's channel is preferred when they are equal.
#
# All cases, source state on the left, target state on the right; the *
# marks the channel that is given up:
#   retired,      active       -> source is returned for retirement
#   unconfirmed*, active       -> source is returned for retirement
#   active*,      active       -> source is returned for retirement
#   active,       unconfirmed* -> target is destroyed
#   active,       retired*     -> target is destroyed
#   unconfirmed*, unconfirmed  -> source is returned for retirement
#   retired,      unconfirmed  -> source is returned for retirement
#   unconfirmed,  retired*     -> target is destroyed
#   retired,      retired      -> source is returned for retirement
#
# When the target channel is destroyed it cannot be restored on a later
# split, but it was only unconfirmed or retired. If the users live on
# different shards the source channel is then cloned onto the target.
#
# @param source_cc channel belonging to from_user
# @param target_cc clashing channel belonging to target_user
# @param target_user the user being merged into
# @param max_position position offset passed to the clone
# @return source_cc when the caller should retire it, nil when target_cc was
#   destroyed instead
def handle_conflicting_ccs(source_cc, target_cc, target_user, max_position)
  source_wins =
    if target_cc.active?
      false
    elsif source_cc.active?
      true
    elsif target_cc.unconfirmed?
      false
    else
      # target is retired here: an unconfirmed source beats it, a retired
      # source does not
      source_cc.unconfirmed?
    end
  return source_cc unless source_wins

  target_cc.destroy_permanently!
  if from_user.shard != target_user.shard
    User.clone_communication_channel(source_cc, target_user, max_position)
  end
  nil
end
# Transfers from_user's observation links (both the ones where it observes
# and the ones where it is observed) to target_user, removing links that
# would become duplicates or self-observations.
#
# The statements below are destructive and order-dependent: each step works
# on what the previous one left behind.
#
# @param target_user the user that takes over the links
# @param user_merge_data merge record; links are passed to add_more_data
#   before they are destroyed or re-pointed
def move_observees(target_user, user_merge_data)
# record all the records before destroying them
# pass the from_user since user_id will be the observer
user_merge_data.add_more_data(from_user.as_observer_observation_links, user: from_user)
user_merge_data.add_more_data(from_user.as_student_observation_links)
# delete duplicate or invalid observers/observees, move the rest
# 1) links whose user_id the target already has among its own observer links
from_user.as_observer_observation_links.where(user_id: target_user.as_observer_observation_links.map(&:user_id)).destroy_all
# 2) links whose user_id is the target itself (would become self-observation)
from_user.as_observer_observation_links.where(user_id: target_user).destroy_all
# 3) the mirror case on the target: its links whose user_id is from_user are
#    recorded, then destroyed
user_merge_data.add_more_data(target_user.as_observer_observation_links.where(user_id: from_user), user: target_user)
target_user.as_observer_observation_links.where(user_id: from_user).destroy_all
# 4) whatever survived now gets the target as its observer
from_user.as_observer_observation_links.update_all(observer_id: target_user.id)
# NOTE(review): despite the "xor" name, this plucks the distinct observer_id
# of every link whose student is either user, at this point in the sequence;
# confirm whether that is the intended set.
xor_observer_ids = UserObservationLink.where(student: [from_user, target_user]).distinct.pluck(:observer_id)
# drop from_user's student-side links whose observer already has a
# student-side link on the target, then move the rest to the target
from_user.as_student_observation_links.where(observer_id: target_user.as_student_observation_links.map(&:observer_id)).destroy_all
from_user.as_student_observation_links.update_all(user_id: target_user.id)
# for any observers not already watching both users, make sure they have
# any missing observer enrollments added
target_user.as_student_observation_links.where(observer_id: xor_observer_ids).each(&:create_linked_enrollments)
end
# For every context module in which both users have a progression row,
# destroys exactly one of the two rows so that from_user's rows can later be
# re-pointed at target_user.
#
# The row destroyed is the first one in a descending order of this ranking:
# completed = 0, started = 1, unlocked = 2, locked = 3 (so a 'locked' row is
# destroyed in preference to a 'completed' one). The CASE has no ELSE, so any
# other workflow_state ranks as NULL; where NULL sorts is left to the database.
#
# @param from_user the user being merged away
# @param target_user the user being merged into
def destroy_conflicting_module_progressions(from_user, target_user)
# there is a unique index on the context_module_progressions table
# we need to delete all the conflicting context_module_progressions
# without impacting the users module progress and without having to
# recalculate the progressions.
# find all the modules progressions and delete the most restrictive
# context_module_progressions
#
# Outer query: from_user's progressions for which a row with the same
# context_module_id exists for target_user.
ContextModuleProgression.
where("context_module_progressions.user_id = ?", from_user.id).
where("EXISTS (SELECT *
FROM #{ContextModuleProgression.quoted_table_name} cmp2
WHERE context_module_progressions.context_module_id=cmp2.context_module_id
AND cmp2.user_id = ?)", target_user.id).find_each do |cmp|
# Inner query: the rows of both users for that module, most restrictive first.
ContextModuleProgression.
where(context_module_id: cmp.context_module_id, user_id: [from_user, target_user]).
order(Arel.sql("CASE WHEN workflow_state = 'completed' THEN 0
WHEN workflow_state = 'started' THEN 1
WHEN workflow_state = 'unlocked' THEN 2
WHEN workflow_state = 'locked' THEN 3
END DESC")).first.destroy
end
end
# Builds an Enrollment query that groups rows by type, role, section and the
# "other" user column, keeping only groups with more than one row. Those
# groups are the enrollments that would collide once +column+ is re-pointed.
#
# @param column [Symbol] the column being merged (:user_id or
#   :associated_user_id); the grouping uses the opposite one
# @return the grouped Enrollment scope
def conflict_scope(column)
  other_column =
    if column == :user_id
      :associated_user_id
    else
      :user_id
    end
  grouping = "type, role_id, course_section_id, #{other_column}"
  Enrollment.select(grouping).group(grouping).having("COUNT(*) > 1")
end
# Returns the enrollments that collide with +enrollment+ across +users+:
# same type, role and section, and the same value in the column that is NOT
# being merged, while the merged column may hold any of +users+.
#
# @param enrollment row supplying the type/role/section and the fixed user
# @param column [Symbol] :user_id when user_id is being merged; anything else
#   is treated as merging associated_user_id
# @param users the pair of users involved in the merge
# @return an Enrollment scope
def enrollment_conflicts(enrollment, column, users)
  same_slot = Enrollment.where(type: enrollment.type,
                               role_id: enrollment.role_id,
                               course_section_id: enrollment.course_section_id)
  user_filter =
    if column == :user_id
      { user_id: users, associated_user_id: enrollment.associated_user_id }
    else
      { user_id: enrollment.user_id, associated_user_id: users }
    end
  same_slot.where(user_filter)
end
# Picks the single enrollment from +scope+ whose state should win a conflict.
#
# Rows are ordered by a workflow_state ranking (active, invited,
# creation_pending, completed, rejected, inactive, deleted, then anything
# else) and, within the same rank, by updated_at descending; the first row of
# that ordering is returned.
#
# @param scope enrollment scope holding the conflicting rows
# @return the first row of the ordering (nil if +scope+ is empty, assuming
#   standard ActiveRecord +first+ semantics)
def enrollment_keeper(scope)
# prefer active enrollments to have no impact to the end user.
# then just keep the newest one.
scope.order(Arel.sql("CASE WHEN workflow_state='active' THEN 1
WHEN workflow_state='invited' THEN 2
WHEN workflow_state='creation_pending' THEN 3
WHEN workflow_state='completed' THEN 4
WHEN workflow_state='rejected' THEN 5
WHEN workflow_state='inactive' THEN 6
WHEN workflow_state='deleted' THEN 7
ELSE 8
END, updated_at DESC")).first
end
# Promotes the other enrollments in +scope+ to +keeper+'s workflow_state and
# then destroys +keeper+ itself. The caller invokes this when the winning
# state lives on a row that is not the target user's.
#
# @param scope the conflicting enrollments (both users' rows)
# @param keeper the enrollment whose workflow_state wins
# @param user_merge_data merge record; the whole scope is recorded first
def update_enrollment_state(scope, keeper, user_merge_data)
  # record both records' state since both are about to change
  user_merge_data.add_more_data(scope)

  # copy the better state from the keeper onto every other row in the scope
  promoted_ids = Enrollment.where(id: scope).where.not(id: keeper).pluck(:id)
  Enrollment.where(id: promoted_ids).update_all(workflow_state: keeper.workflow_state)
  EnrollmentState.force_recalculation(promoted_ids)

  # mark the would-be keeper as deleted so it will not be moved later
  keeper.destroy
end
# Resolves every enrollment that would collide once +column+ is re-pointed
# from from_user to +target_user+.
#
# For each conflicting group the best-state row is chosen with
# #enrollment_keeper. If the target's row is not that keeper, the target's row
# is promoted via #update_enrollment_state. Any remaining active, non-keeper
# rows that belong to from_user are recorded and destroyed so they are not
# moved afterwards.
#
# @param column [Symbol] :user_id or :associated_user_id
# @param target_user the user being merged into
# @param user_merge_data merge record that collects what was touched
def handle_conflicts(column, target_user, user_merge_data)
  both_users = [from_user, target_user]

  # get each pair of conflicts and "handle them"
  conflict_scope(column).where(column => both_users).find_each do |conflict|
    # the rows that collide with this one
    pair = enrollment_conflicts(conflict, column, both_users)
    # the highest state between the two users' enrollments
    best = enrollment_keeper(pair)

    # if the target's row is not the keeper it needs promoting; the whole pair
    # is passed so both rows are recorded in case of a split
    target_needs_promotion = pair.where.not(id: best).where(column => target_user).exists?
    update_enrollment_state(pair, best, user_merge_data) if target_needs_promotion

    # from_user rows in a worse state than the keeper: record their current
    # state, then mark them deleted so they will not be moved later
    leftovers = pair.active.where.not(id: best).where(column => from_user)
    user_merge_data.add_more_data(leftovers)
    leftovers.destroy_all
  end
end
# Destroys active ObserverEnrollment rows that link the two users to each
# other (either one observing the other), since after the merge they would
# describe a user observing themself.
#
# @param target_user the user being merged into
# @param user_merge_data merge record; the rows are passed to add_more_data
#   before being destroyed
def remove_self_observers(target_user, user_merge_data)
# prevent observing self by marking them as deleted
# The parenthesised clause matches both directions of the pair; AND binds
# tighter than OR, so each side of the OR is one (associated_user_id, user_id)
# combination.
to_delete = Enrollment.active.where("type = 'ObserverEnrollment' AND
(associated_user_id = :target_user AND user_id = :from_user OR
associated_user_id = :from_user AND user_id = :target_user)",
{target_user: target_user, from_user: from_user})
user_merge_data.add_more_data(to_delete)
to_delete.destroy_all
end
# Moves from_user's enrollments to +target_user+, first as the associated
# (observed) user and then as the enrolled user.
#
# For each of the two columns, on every shard associated with from_user and
# inside one Enrollment transaction: conflicts are resolved, would-be
# self-observations are removed, and the remaining active enrollments are
# recorded and re-pointed at the target.
#
# @param target_user the user being merged into
# @param user_merge_data merge record that collects what was touched
def move_enrollments(target_user, user_merge_data)
  %i[associated_user_id user_id].each do |column|
    Shard.with_each_shard(from_user.associated_shards) do
      Enrollment.transaction do
        handle_conflicts(column, target_user, user_merge_data)
        remove_self_observers(target_user, user_merge_data)

        # everything not marked as deleted above now moves to the target user
        movable = Enrollment.active.where(column => from_user)
        user_merge_data.add_more_data(movable)
        movable.update_all(column => target_user.id)
      end
    end
  end
end
# Rewrites the serialized Version rows of the records in +scope+ so that
# +column+ points at +target_user+ wherever it pointed at +from_user+.
#
# Each version's YAML is loaded, patched under both the string and the symbol
# form of +column+, re-serialized and saved. For 'Submission' versions the
# matching SubmissionVersion rows of from_user are re-pointed as well.
# A failure on a single version is logged; it is re-raised everywhere except
# in the production environment.
#
# @param from_user the user id to replace
# @param target_user the user id to write
# @param scope records whose versions are rewritten, processed in id batches
# @param table table name used to derive the versionable type
# @param column the attribute inside the version that holds the user id
def update_versions(from_user, target_user, scope, table, column)
  scope.find_ids_in_batches do |ids|
    versionable_type =
      if table.to_s == 'quizzes/quiz_submissions'
        # TODO: This is a hack to support namespacing
        ['QuizSubmission', 'Quizzes::QuizSubmission']
      else
        table.to_s.classify
      end

    touched_version_ids = []
    Version.where(:versionable_type => versionable_type, :versionable_id => ids).find_each do |version|
      begin
        # NOTE(review): YAML.load is used on stored version data; confirm this
        # content is trusted before changing the loader.
        attrs = YAML.load(version.yaml)
        # i'm pretty sure simply_versioned just stores fields as strings, but
        # i haven't had time to verify that 100% yet, so better safe than sorry
        [column.to_s, column.to_sym].each do |key|
          attrs[key] = target_user.id if attrs[key] == from_user.id
        end
        version.yaml = attrs.to_yaml
        version.save!
        touched_version_ids << version.id if versionable_type == 'Submission'
      rescue => e
        Rails.logger.error "migrating versions for #{table} column #{column} failed: #{e}"
        raise e unless Rails.env.production?
      end
    end

    unless touched_version_ids.empty?
      SubmissionVersion.where(version_id: touched_version_ids, user_id: from_user).update_all(user_id: target_user.id)
    end
  end
end
end