Skip to content
New issue

Have a question about this project? Sign up for a free GitHub account to open an issue and contact its maintainers and the community.

By clicking “Sign up for GitHub”, you agree to our terms of service and privacy statement. We’ll occasionally send you account related emails.

Already on GitHub? Sign in to your account

feat: [no merge] spike on replicating content metadata into a model. … #150

Draft
wants to merge 1 commit into
base: main
Choose a base branch
from
Draft
Show file tree
Hide file tree
Changes from all commits
Commits
File filter

Filter by extension

Filter by extension

Conversations
Failed to load comments.
Loading
Jump to
Jump to file
Failed to load files.
Loading
Diff view
Diff view
291 changes: 232 additions & 59 deletions enterprise_subsidy/apps/content_metadata/api.py
Original file line number Diff line number Diff line change
Expand Up @@ -6,13 +6,15 @@
from decimal import Decimal

from django.conf import settings
from django.utils import functional, timezone
from edx_django_utils.cache import TieredCache

from enterprise_subsidy.apps.api_client.enterprise_catalog import EnterpriseCatalogApiClient
from enterprise_subsidy.apps.core.utils import versioned_cache_key
from enterprise_subsidy.apps.subsidy.constants import CENTS_PER_DOLLAR

from .constants import CourseModes, ProductSources
from .models import ReplicatedContentMetadata

logger = logging.getLogger(__name__)

Expand All @@ -34,6 +36,112 @@ def content_metadata_cache_key(enterprise_customer_uuid, content_key):
return versioned_cache_key(CACHE_NAMESPACE, enterprise_customer_uuid, content_key)


def _price_for_content(content_data, course_run_data):
"""
Helper to return the "official" price for content.
The endpoint at ``self.content_metadata_url`` will always return price fields
as USD (dollars), possibly as a string or a float. This method converts
those values to USD cents as an integer.
"""
content_price = None
if course_run_data.get('first_enrollable_paid_seat_price'):
content_price = course_run_data['first_enrollable_paid_seat_price']

if not content_price:
enrollment_mode_for_content = _mode_for_content(content_data)
for entitlement in content_data.get('entitlements', []):
if entitlement.get('mode') == enrollment_mode_for_content:
content_price = entitlement.get('price')

if content_price:
return int(Decimal(content_price) * CENTS_PER_DOLLAR)
else:
logger.info(
f"Could not determine price for content key {content_data.get('key')} "
f"and course run key {course_run_data.get('key')}"
)
return None


def _mode_for_content(content_data):
"""
Helper to extract the relevant enrollment mode for a piece of content metadata.
"""
product_source = _product_source_for_content(content_data)
return CONTENT_MODES_BY_PRODUCT_SOURCE.get(product_source, CourseModes.EDX_VERIFIED.value)


def _product_source_for_content(content_data):
"""
Helps get the product source string, given a dict of ``content_data``.
"""
if product_source := content_data.get('product_source'):
source_name = product_source.get('slug')
if source_name in CONTENT_MODES_BY_PRODUCT_SOURCE:
return source_name
return ProductSources.EDX.value


def _get_geag_variant_id_for_content(content_data):
"""
Returns the GEAG ``variant_id`` or ``None``, given a dict of ``content_data``.
In the GEAG system a ``variant_id`` is aka a ``product_id``.
"""
variant_id = None
if additional_metadata := content_data.get('additional_metadata'):
variant_id = additional_metadata.get('variant_id')
return variant_id


def _get_course_run(content_identifier, content_data):
"""
Given a content_identifier (key, run key, uuid) extract the appropriate course_run.
When given a run key or uuid for a run, extract that. When given a course key or
course uuid, extract the advertised course_run.
"""
if content_data.get('content_type') == 'courserun':
return content_data

course_run_identifier = content_identifier
# if the supplied content_identifer refers to the course, look for an advertised run
if content_identifier == content_data.get('key') or content_identifier == content_data.get('uuid'):
course_run_identifier = content_data.get('advertised_course_run_uuid')
for course_run in content_data.get('course_runs', []):
if course_run_identifier == course_run.get('key') or course_run_identifier == course_run.get('uuid'):
return course_run
return {}


def _get_and_cache_content_metadata(enterprise_customer_uuid, content_identifier):
"""
Fetches details about the given content from a tiered (request + django) cache;
or it fetches from the enterprise-catalog API if not present in the cache,
and then caches that result.
"""
cache_key = content_metadata_cache_key(enterprise_customer_uuid, content_identifier)
cached_response = TieredCache.get_cached_response(cache_key)
if cached_response.is_found:
return cached_response.value

course_details = EnterpriseCatalogApiClient().get_content_metadata_for_customer(
enterprise_customer_uuid,
content_identifier
)
if course_details:
TieredCache.set_all_tiers(
cache_key,
course_details,
django_cache_timeout=CONTENT_METADATA_CACHE_TIMEOUT,
)
logger.info(
'Fetched course details %s for customer %s and content_identifier %s',
course_details,
enterprise_customer_uuid,
content_identifier,
)
return course_details


class ContentMetadataApi:
"""
An API for interacting with enterprise catalog content metadata.
Expand All @@ -54,51 +162,26 @@ def price_for_content(self, content_data, course_run_data):
as USD (dollars), possibly as a string or a float. This method converts
those values to USD cents as an integer.
"""
content_price = None
if course_run_data.get('first_enrollable_paid_seat_price'):
content_price = course_run_data['first_enrollable_paid_seat_price']

if not content_price:
enrollment_mode_for_content = self.mode_for_content(content_data)
for entitlement in content_data.get('entitlements', []):
if entitlement.get('mode') == enrollment_mode_for_content:
content_price = entitlement.get('price')

if content_price:
return int(Decimal(content_price) * CENTS_PER_DOLLAR)
else:
logger.info(
f"Could not determine price for content key {content_data.get('key')} "
f"and course run key {course_run_data.get('key')}"
)
return None
return _price_for_content(content_data, course_run_data)

def mode_for_content(self, content_data):
"""
Helper to extract the relevant enrollment mode for a piece of content metadata.
"""
product_source = self.product_source_for_content(content_data)
return CONTENT_MODES_BY_PRODUCT_SOURCE.get(product_source, CourseModes.EDX_VERIFIED.value)
return _mode_for_content(content_data)

def product_source_for_content(self, content_data):
"""
Helps get the product source string, given a dict of ``content_data``.
"""
if product_source := content_data.get('product_source'):
source_name = product_source.get('slug')
if source_name in CONTENT_MODES_BY_PRODUCT_SOURCE:
return source_name
return ProductSources.EDX.value
return _product_source_for_content(content_data)

def get_geag_variant_id_for_content(self, content_data):
"""
Returns the GEAG ``variant_id`` or ``None``, given a dict of ``content_data``.
In the GEAG system a ``variant_id`` is aka a ``product_id``.
"""
variant_id = None
if additional_metadata := content_data.get('additional_metadata'):
variant_id = additional_metadata.get('variant_id')
return variant_id
return _get_geag_variant_id_for_content(content_data)

def summary_data_for_content(self, content_identifier, content_data):
"""
Expand All @@ -123,17 +206,7 @@ def get_course_run(self, content_identifier, content_data):
When given a run key or uuid for a run, extract that. When given a course key or
course uuid, extract the advertised course_run.
"""
if content_data.get('content_type') == 'courserun':
return content_data

course_run_identifier = content_identifier
# if the supplied content_identifer refers to the course, look for an advertised run
if content_identifier == content_data.get('key') or content_identifier == content_data.get('uuid'):
course_run_identifier = content_data.get('advertised_course_run_uuid')
for course_run in content_data.get('course_runs', []):
if course_run_identifier == course_run.get('key') or course_run_identifier == course_run.get('uuid'):
return course_run
return {}
return _get_course_run(content_identifier, content_data)

def get_content_summary(self, enterprise_customer_uuid, content_identifier):
"""
Expand Down Expand Up @@ -206,25 +279,125 @@ def get_content_metadata(enterprise_customer_uuid, content_identifier):
or it fetches from the enterprise-catalog API if not present in the cache,
and then caches that result.
"""
cache_key = content_metadata_cache_key(enterprise_customer_uuid, content_identifier)
cached_response = TieredCache.get_cached_response(cache_key)
if cached_response.is_found:
return cached_response.value
return _get_and_cache_content_metadata(enterprise_customer_uuid, content_identifier)

course_details = EnterpriseCatalogApiClient().get_content_metadata_for_customer(
enterprise_customer_uuid,
content_identifier

class UpstreamContentMetadata:
"""
Expected interactions with this class:
# given a customer and desired course/run key
enterprise_customer_uuid = 'some-uuid'
content_identifier = 'whatever-course-or-run-key'

# fetches course/run metadata from upstream or cache
metadata_wrapper = UpstreamContentMetadata(enterprise_customer_uuid, content_identifier)
"""
def __init__(self, enterprise_customer_uuid, content_identifier):
self.enterprise_customer_uuid = enterprise_customer_uuid
self.content_identifier = content_identifier
self.raw_metadata = None
self.course_run_data = None
self.fetch()

def fetch(self):
self.raw_metadata = _get_and_cache_content_metadata(
self.enterprise_customer_uuid,
self.content_identifier,
)
if course_details:
TieredCache.set_all_tiers(
cache_key,
course_details,
django_cache_timeout=CONTENT_METADATA_CACHE_TIMEOUT,
)
logger.info(
'Fetched course details %s for customer %s and content_identifier %s',
course_details,
enterprise_customer_uuid,
content_identifier,
self.course_run_data = _get_course_run(self.content_identifier, self.raw_metadata)

@functional.cached_property
def title(self):
self.raw_metadata.get('title')

@functional.cached_property
def price(self):
return _price_for_content(self.raw_metadata, self.course_run_data)

@functional.cached_property
def course_mode(self):
return _mode_for_content(self.raw_metadata)

@functional.cached_property
def product_source(self):
return _product_source_for_content(self.raw_metadata)

@functional.cached_property
def geag_variant_id(self):
return _get_geag_variant_id_for_content(self.raw_metadata)

@functional.cached_property
def content_key(self):
return self.raw_metadata.get('key')

@functional.cached_property
def course_run_key(self):
return self.course_run_data.get('key')

@functional.cached_property
def content_type(self):
return self.raw_metadata.get('content_type')


def test_upstream():
return UpstreamContentMetadata(
enterprise_customer_uuid='378d5bf0-f67d-4bf7-8b2a-cbbc53d0f772',
content_identifier='course-v1:edX+DemoX+Demo_Course',
)


class ContentMetadataReplicator:
"""
"""
def __init__(self, enterprise_customer_uuid, content_identifier):
self.enterprise_customer_uuid = enterprise_customer_uuid
self.content_identifier = content_identifier
self.upstream_data = None

def fetch_upstream(self):
self.upstream_data = UpstreamContentMetadata(
enterprise_customer_uuid=self.enterprise_customer_uuid,
content_identifier=self.content_identifier,
)

def get_recent_metadata_record(self):
return ReplicatedContentMetadata.get_recent_record_or_null(
enterprise_customer_uuid=self.enterprise_customer_uuid,
content_key=self.content_identifier,
)

def _replicate_metadata_record(self):
self.fetch_upstream()
new_values = {
'content_type': self.upstream_data.content_type,
'raw_metadata': self.upstream_data.raw_metadata,
'raw_fetched_at': timezone.now(),
'title': self.upstream_data.title,
'price': self.upstream_data.price,
'product_source': self.upstream_data.product_source,
'course_mode': self.upstream_data.course_mode,
}
record, _ = ReplicatedContentMetadata.objects.update_or_create(
enterprise_customer_uuid=self.enterprise_customer_uuid,
content_key=self.content_identifier,
defaults=new_values,
)
return course_details
return record

def replicate(self):
# Check for a recent replicated record in the DB.
# If we have a good one, return it.
record = self.get_recent_metadata_record()
if record:
return record

# Otherwise, fetch from upstream, replicate, and return
return self._replicate_metadata_record()


def test_replicate():
replicator = ContentMetadataReplicator(
enterprise_customer_uuid='378d5bf0-f67d-4bf7-8b2a-cbbc53d0f772',
content_identifier='course-v1:edX+DemoX+Demo_Course',
)
return replicator.replicate()
Loading