forked from CenterForOpenScience/osf.io
-
Notifications
You must be signed in to change notification settings - Fork 0
Commit
This commit does not belong to any branch on this repository, and may belong to a fork outside of the repository.
add management command to migrate preprint affiliations
- Loading branch information
John Tordoff
committed
Oct 31, 2024
1 parent
9394a0f
commit 56c466c
Showing
2 changed files
with
203 additions
and
0 deletions.
There are no files selected for viewing
This file contains bidirectional Unicode text that may be interpreted or compiled differently than what appears below. To review, open the file in an editor that reveals hidden Unicode characters.
Learn more about bidirectional Unicode characters
Original file line number | Diff line number | Diff line change |
---|---|---|
@@ -0,0 +1,96 @@ | ||
import datetime | ||
import logging | ||
|
||
from django.core.management.base import BaseCommand | ||
from django.db import transaction | ||
from osf.models import PreprintContributor | ||
from django.db.models import F, Count | ||
|
||
logger = logging.getLogger(__name__) | ||
|
||
|
||
class Command(BaseCommand): | ||
"""Assign affiliations from users to preprints where they have write or admin permissions, with optional exclusion by user GUIDs.""" | ||
|
||
help = 'Assign affiliations from users to preprints where they have write or admin permissions.' | ||
|
||
def add_arguments(self, parser): | ||
parser.add_argument( | ||
'--exclude-guids', | ||
nargs='+', | ||
dest='exclude_guids', | ||
help='List of user GUIDs to exclude from affiliation assignment' | ||
) | ||
parser.add_argument( | ||
'--dry-run', | ||
action='store_true', | ||
dest='dry_run', | ||
help='If true, performs a dry run without making changes' | ||
) | ||
|
||
def handle(self, *args, **options): | ||
start_time = datetime.datetime.now() | ||
logger.info(f'Script started at: {start_time}') | ||
|
||
exclude_guids = set(options.get('exclude_guids') or []) | ||
dry_run = options.get('dry_run', False) | ||
|
||
if dry_run: | ||
logger.info('Dry run mode activated.') | ||
|
||
processed_count, updated_count, skipped_count = assign_affiliations_to_preprints( | ||
exclude_guids=exclude_guids, | ||
dry_run=dry_run | ||
) | ||
|
||
finish_time = datetime.datetime.now() | ||
logger.info(f'Script finished at: {finish_time}') | ||
logger.info(f'Total processed: {processed_count}, Updated: {updated_count}, Skipped: {skipped_count}') | ||
logger.info(f'Total run time: {finish_time - start_time}') | ||
|
||
|
||
def assign_affiliations_to_preprints(exclude_guids=None, dry_run=True): | ||
exclude_guids = exclude_guids or set() | ||
contributors = PreprintContributor.objects.filter( | ||
preprint__preprintgroupobjectpermission__permission__codename__in=['write_preprint', 'admin_preprint'], | ||
preprint__preprintgroupobjectpermission__group__user=F('user'), | ||
).annotate( | ||
num_affiliations=Count('user__institutionaffiliation') | ||
).filter( | ||
num_affiliations__gt=0 # Exclude users with no affiliations | ||
).select_related( | ||
'user', | ||
'preprint' | ||
).exclude( | ||
user__guids___id__in=exclude_guids | ||
).distinct() | ||
|
||
processed_count = updated_count = skipped_count = 0 | ||
|
||
with transaction.atomic(): | ||
for contributor in contributors: | ||
user = contributor.user | ||
preprint = contributor.preprint | ||
|
||
user_institutions = set(user.get_affiliated_institutions()) | ||
preprint_institutions = set(preprint.affiliated_institutions.all()) | ||
|
||
new_institutions = user_institutions - preprint_institutions | ||
|
||
if new_institutions: | ||
processed_count += 1 | ||
if not dry_run: | ||
for institution in new_institutions: | ||
preprint.affiliated_institutions.add(institution) | ||
updated_count += 1 | ||
logger.info( | ||
f'Assigned {len(new_institutions)} affiliations from user <{user._id}> to preprint <{preprint._id}>.' | ||
) | ||
else: | ||
logger.info( | ||
f'Dry run: Would assign {len(new_institutions)} affiliations from user <{user._id}> to preprint <{preprint._id}>.' | ||
) | ||
else: | ||
skipped_count += 1 | ||
|
||
return processed_count, updated_count, skipped_count |
107 changes: 107 additions & 0 deletions
107
osf_tests/management_commands/test_migrate_preprint_affiliations.py
This file contains bidirectional Unicode text that may be interpreted or compiled differently than what appears below. To review, open the file in an editor that reveals hidden Unicode characters.
Learn more about bidirectional Unicode characters
Original file line number | Diff line number | Diff line change |
---|---|---|
@@ -0,0 +1,107 @@ | ||
import pytest | ||
from osf.management.commands.migrate_preprint_affiliation import assign_affiliations_to_preprints | ||
from osf_tests.factories import ( | ||
PreprintFactory, | ||
InstitutionFactory, | ||
AuthUserFactory, | ||
) | ||
|
||
|
||
@pytest.mark.django_db | ||
class TestAssignAffiliationsToPreprints: | ||
|
||
@pytest.fixture() | ||
def institution(self): | ||
return InstitutionFactory() | ||
|
||
@pytest.fixture() | ||
def user_with_affiliation(self, institution): | ||
user = AuthUserFactory() | ||
user.add_or_update_affiliated_institution(institution) | ||
user.save() | ||
return user | ||
|
||
@pytest.fixture() | ||
def user_without_affiliation(self): | ||
return AuthUserFactory() | ||
|
||
@pytest.fixture() | ||
def preprint_with_affiliated_contributor(self, user_with_affiliation): | ||
preprint = PreprintFactory() | ||
preprint.add_contributor( | ||
user_with_affiliation, | ||
permissions='admin', | ||
visible=True | ||
) | ||
return preprint | ||
|
||
@pytest.fixture() | ||
def preprint_with_non_affiliated_contributor(self, user_without_affiliation): | ||
preprint = PreprintFactory() | ||
preprint.add_contributor( | ||
user_without_affiliation, | ||
permissions='admin', | ||
visible=True | ||
) | ||
return preprint | ||
|
||
@pytest.mark.parametrize('dry_run', [True, False]) | ||
def test_assign_affiliations_with_affiliated_contributor(self, preprint_with_affiliated_contributor, institution, dry_run): | ||
preprint = preprint_with_affiliated_contributor | ||
preprint.affiliated_institutions.clear() | ||
preprint.save() | ||
|
||
assign_affiliations_to_preprints(dry_run=dry_run) | ||
|
||
if dry_run: | ||
assert not preprint.affiliated_institutions.exists() | ||
else: | ||
assert institution in preprint.affiliated_institutions.all() | ||
|
||
@pytest.mark.parametrize('dry_run', [True, False]) | ||
def test_no_affiliations_for_non_affiliated_contributor(self, preprint_with_non_affiliated_contributor, dry_run): | ||
preprint = preprint_with_non_affiliated_contributor | ||
preprint.affiliated_institutions.clear() | ||
preprint.save() | ||
|
||
assign_affiliations_to_preprints(dry_run=dry_run) | ||
|
||
assert not preprint.affiliated_institutions.exists() | ||
|
||
@pytest.mark.parametrize('dry_run', [True, False]) | ||
def test_exclude_contributor_by_guid(self, preprint_with_affiliated_contributor, institution, dry_run): | ||
preprint = preprint_with_affiliated_contributor | ||
preprint.affiliated_institutions.clear() | ||
preprint.save() | ||
|
||
assert preprint.contributors.last().get_affiliated_institutions() | ||
exclude_guids = {user._id for user in preprint.contributors.all()} | ||
|
||
assign_affiliations_to_preprints(exclude_guids=exclude_guids, dry_run=dry_run) | ||
|
||
assert not preprint.affiliated_institutions.exists() | ||
|
||
@pytest.mark.parametrize('dry_run', [True, False]) | ||
def test_affiliations_from_multiple_contributors(self, institution, dry_run): | ||
user1 = AuthUserFactory() | ||
user1.add_or_update_affiliated_institution(institution) | ||
user1.save() | ||
|
||
user2 = AuthUserFactory() | ||
institution2 = InstitutionFactory() | ||
user2.add_or_update_affiliated_institution(institution2) | ||
user2.save() | ||
|
||
preprint = PreprintFactory() | ||
preprint.affiliated_institutions.clear() | ||
preprint.add_contributor(user1, permissions='write', visible=True) | ||
preprint.add_contributor(user2, permissions='admin', visible=True) | ||
preprint.save() | ||
|
||
assign_affiliations_to_preprints(dry_run=dry_run) | ||
|
||
if dry_run: | ||
assert not preprint.affiliated_institutions.exists() | ||
else: | ||
affiliations = set(preprint.affiliated_institutions.all()) | ||
assert affiliations == {institution, institution2} |