fluffychat/lib/pangea/events/models/representation_content_mode...

import 'package:matrix/matrix.dart';

import 'package:fluffychat/pangea/analytics_misc/construct_type_enum.dart';
import 'package:fluffychat/pangea/analytics_misc/construct_use_type_enum.dart';
import 'package:fluffychat/pangea/analytics_misc/constructs_model.dart';
import 'package:fluffychat/pangea/choreographer/models/choreo_record.dart';
import 'package:fluffychat/pangea/choreographer/models/pangea_match_model.dart';
import 'package:fluffychat/pangea/events/models/pangea_token_model.dart';
import 'package:fluffychat/pangea/toolbar/models/speech_to_text_models.dart';
import 'package:fluffychat/widgets/matrix.dart';

/// The text of a message in a single language, as carried by a
/// [RepresentationEvent].
///
/// A [RepresentationEvent] is the child of an [EventTypes.Message] event and
/// has two potential child events, [PangeaTokensEvent] and [PangeaIGCEvent],
/// which contain [PangeaMessageTokens] and [ChoreoRecord], respectively.
class PangeaRepresentation {
  /// System-detected language, possibly condensed from a list, but only
  /// with high certainty. Cannot be "unk".
  String langCode;

  /// Final sent text.
  ///
  /// If this was a process, a [PangeaIGCEvent] will contain the changes.
  String text;

  /// Serialized under "snt"; read as `false` when the key is absent.
  /// See the os/ow combinations described below.
  bool originalSent;

  /// Serialized under "wrttn"; read as `false` when the key is absent.
  /// See the os/ow combinations described below.
  bool originalWritten;

  /// A representation can be created via speech to text on the original
  /// message.
  SpeechToTextModel? speechToText;

  // How do we know which representation was sent by the author?
  //   RepresentationEvent.text == PangeaMessageEvent.event.body
  //   use: to know whether directUse
  //
  // How do we know which representation was the original L1 message that was
  // translated (if it exists)?
  //   (of L2 rep) RepresentationEvent.igc.steps.first.text
  //     == RepresentationEvent.text (of L1 rep)
  //   use: for base text for future translations
  //
  // os = originalSent, ow = originalWritten
  //
  // os = true and ow = false
  //   rep that went through IGC/IT
  //
  // os = false and ow = false
  //   rep added by other user
  //
  // os = true and ow = true
  //   potentially L1 language use, maybe with limited IGC, and ignored out of
  //   target cries
  //   potentially perfect L2 use
  //
  // os = false and ow = true
  //   L1 message that then went through significant IGC and/or IT
  //   L2 message with errors that went through IGC

  PangeaRepresentation({
    required this.langCode,
    required this.text,
    required this.originalSent,
    required this.originalWritten,
    this.speechToText,
  });

  /// Builds a representation from its JSON form.
  ///
  /// The "snt" and "wrttn" flags default to `false` when missing, and
  /// [speechToText] stays `null` when there is no "stt" entry.
  factory PangeaRepresentation.fromJson(Map<String, dynamic> json) {
    final sttJson = json[_speechToTextKey];
    return PangeaRepresentation(
      langCode: json[_langCodeKey],
      text: json[_textKey],
      originalSent: json[_originalSentKey] ?? false,
      originalWritten: json[_originalWrittenKey] ?? false,
      speechToText:
          sttJson == null ? null : SpeechToTextModel.fromJson(sttJson),
    );
  }

  static const _textKey = "txt";
  static const _langCodeKey = "lang";
  static const _originalSentKey = "snt";
  static const _originalWrittenKey = "wrttn";
  static const _speechToTextKey = "stt";

  /// Serializes this representation.
  ///
  /// The two boolean flags are only written when `true`, and the
  /// speech-to-text entry only when [speechToText] is non-null.
  Map<String, dynamic> toJson() {
    // Copy to a local so the null check promotes without needing `!`.
    final stt = speechToText;
    return <String, dynamic>{
      _textKey: text,
      _langCodeKey: langCode,
      if (originalSent) _originalSentKey: originalSent,
      if (originalWritten) _originalWrittenKey: originalWritten,
      if (stt != null) _speechToTextKey: stt.toJson(),
    };
  }

  /// Get construct uses for the message that weren't captured during
  /// language assistance.
  ///
  /// Takes a list of [tokens] and a [choreo] record, which is searched
  /// through for each token for its construct use type.
  /// Also takes either an [event] (typically when the Representation itself
  /// is available) or construct use [metadata] (when the event is not
  /// available, i.e. immediately after message send) to create the construct
  /// use. When [metadata] is given it is used as-is; otherwise it is built
  /// from [event].
  ///
  /// Returns an empty list when the part of [langCode] before the first "-"
  /// differs from the short code of the user's L2, or when neither [event]
  /// nor [metadata] supplies a room ID. Only tokens whose lemma has
  /// `saveVocab` set contribute uses.
  List<OneConstructUse> vocabAndMorphUses({
    required List<PangeaToken> tokens,
    Event? event,
    ConstructUseMetaData? metadata,
    ChoreoRecord? choreo,
  }) {
    final l2 = MatrixState.pangeaController.languageController.userL2;
    if (langCode.split("-")[0] != l2?.langCodeShort) return [];

    // missing vital info so return
    if (event?.roomId == null && metadata?.roomId == null) return [];

    // The guard above guarantees that when `metadata` is null, `event` and
    // its room ID are not, so the assertions below cannot fail.
    final useMetadata = metadata ??
        ConstructUseMetaData(
          roomId: event!.roomId!,
          eventId: event.eventId,
          timeStamp: event.originServerTs,
        );

    // for each token, record whether selected in ga, ta, or wa
    return [
      for (final token in tokens)
        if (token.lemma.saveVocab)
          ..._getUsesForToken(token, useMetadata, choreo: choreo),
    ];
  }

  /// Returns the construct uses for the given [token].
  ///
  /// If there is no [choreo], the [token] is considered to be a
  /// [ConstructUseTypeEnum.wa]. Later on, we may want to consider putting it
  /// in some category of like 'pending'.
  ///
  /// For both vocab and morph constructs, we should
  /// 1) give wa if no assistance was used
  /// 2) give ga if IGC was used and
  /// 3) make no use if IT was used
  ///
  /// The choreo steps are scanned in order and the first decisive step wins:
  /// a step with an IT step yields an empty list, and an accepted match with
  /// a choice whose value contains the token's text yields ga uses. If no
  /// step is decisive, the token gets wa uses.
  List<OneConstructUse> _getUsesForToken(
    PangeaToken token,
    ConstructUseMetaData metadata, {
    ChoreoRecord? choreo,
  }) {
    if (choreo == null) return _unassistedUses(token, metadata);

    final content = token.text.content;
    for (final step in choreo.choreoSteps) {
      // IT was used: return no uses. Note this does not look at whether the
      // token itself took part in the IT step.
      if (step.itStep != null) return [];

      // Only accepted matches can make the token a ga.
      final match = step.acceptedOrIgnoredMatch;
      if (match == null || match.status != PangeaMatchStatus.accepted) {
        continue;
      }

      final choices = match.match.choices;
      if (choices == null) continue;

      // Substring check: does any offered choice contain the token's text?
      final stepContainedToken =
          choices.any((choice) => choice.value.contains(content));
      if (!stepContainedToken) continue;

      // give ga if IGC was used; the vocab use comes first here.
      // No saveVocab check in this branch: [vocabAndMorphUses] only passes
      // tokens whose lemma already has saveVocab set.
      return [
        token.toVocabUse(ConstructUseTypeEnum.ga, metadata),
        ..._morphUses(token, ConstructUseTypeEnum.ga, metadata),
      ];
    }

    // the token wasn't found in any IT or IGC step, so it was wa
    return _unassistedUses(token, metadata);
  }

  /// Builds the [ConstructUseTypeEnum.wa] uses for [token]: its morph uses
  /// followed by a vocab use when the token's lemma has `saveVocab` set.
  List<OneConstructUse> _unassistedUses(
    PangeaToken token,
    ConstructUseMetaData metadata,
  ) {
    return [
      ..._morphUses(token, ConstructUseTypeEnum.wa, metadata),
      if (token.lemma.saveVocab)
        token.toVocabUse(ConstructUseTypeEnum.wa, metadata),
    ];
  }

  /// Builds the morph construct uses for [token] with the given [useType]:
  /// one for its part of speech (category "POS"), then one per entry of the
  /// token's morph map (entry key as category, entry value as lemma).
  List<OneConstructUse> _morphUses(
    PangeaToken token,
    ConstructUseTypeEnum useType,
    ConstructUseMetaData metadata,
  ) {
    final form = token.text.content;
    return [
      OneConstructUse(
        useType: useType,
        lemma: token.pos,
        form: form,
        category: "POS",
        constructType: ConstructTypeEnum.morph,
        metadata: metadata,
      ),
      for (final entry in token.morph.entries)
        OneConstructUse(
          useType: useType,
          lemma: entry.value,
          form: form,
          category: entry.key,
          constructType: ConstructTypeEnum.morph,
          metadata: metadata,
        ),
    ];
  }
}
fix: fix dart formatting for CI (#1368) * fix: fix dart formatting for CI * fix: sorted imports, updated deprecated flutter functions * fix: format files * fix: format files * feat: replace syncfusion flutter package with excel flutter package * fix: don't run enable google services patch in CI * fix: update iOS supported platforms for enable ios build script * fix: commented out linux build in integrate CI 10 months ago			`import 'package:matrix/matrix.dart';`

Morph-repo-2 (#1681) * feat(morphs): repo for getting lang-specific list of morphs * integrated repo into use of morph features and tags * generated * merged with previous push * generated * generated * chore: fix .env file path --------- Co-authored-by: github-actions[bot] <41898282+github-actions[bot]@users.noreply.github.com> Co-authored-by: ggurdin <46800240+ggurdin@users.noreply.github.com> Co-authored-by: ggurdin <ggurdin@gmail.com> 9 months ago			`import 'package:fluffychat/pangea/analytics_misc/construct_type_enum.dart';`
			`import 'package:fluffychat/pangea/analytics_misc/construct_use_type_enum.dart';`
			`import 'package:fluffychat/pangea/analytics_misc/constructs_model.dart';`
1435 refactor into function specific groupings (#1440) * fix: deleted unreferenced files * fix: sort files based on function 10 months ago			`import 'package:fluffychat/pangea/choreographer/models/choreo_record.dart';`
			`import 'package:fluffychat/pangea/choreographer/models/pangea_match_model.dart';`
			`import 'package:fluffychat/pangea/events/models/pangea_token_model.dart';`
			`import 'package:fluffychat/pangea/toolbar/models/speech_to_text_models.dart';`
moved functions for constructing constructs out of pangea message event so they can be created without direct access to the representation event 1 year ago			`import 'package:fluffychat/widgets/matrix.dart';`
code files 2 years ago
			`/// this class is contained within a [RepresentationEvent]`
			`/// this event is the child of a [EventTypes.Message]`
			`/// the event has two potential children events -`
			`/// [PangeaTokensEvent] and [PangeaIGCEvent]`
			`/// these events contain [PangeaMessageTokens] and [ChoreoRecord], respectively.`
			`class PangeaRepresentation {`
			`/// system-detected language, possibly condensed from a list,`
			`/// but only with high certainty`
			`/// cannot be "unk"`
			`String langCode;`

			`/// final sent text`
			`/// if this was a process, a [PangeaIGCEvent] will contain changes`
			`String text;`

			`bool originalSent;`
			`bool originalWritten;`

full draft speech to text with word level feedback 2 years ago			`// a representation can be create via speech to text on the original message`
			`SpeechToTextModel? speechToText;`

code files 2 years ago			`// how do we know which representation was sent by author?`
			`// RepresentationEvent.text == PangeaMessageEvent.event.body`
			`// use: to know whether directUse`

			`// how do we know which representation was original L1 message that was translated (if it exists)?`
			`// (of l2 rep) RepresentationEvent.igc.steps.first.text = RepresentationEvent.text (of L1 rep)`
			`// use: for base text for future translations`

			`// os = true and ow = false`
			`// rep that went through IGC/IT`

			`// os = false and ow = false`
			`// rep added by other user`

			`// os = true and ow = true`
			`// potentially L1 language use, maybe with limited IGC, and ignored out of target cries`
			`// potentially perfect L2 use`

			`// os = false and ow = true`
			`// L1 message that then went through significant IGC and/or IT`
			`// L2 message with errors that went through IGC`

			`PangeaRepresentation({`
			`required this.langCode,`
			`required this.text,`
			`required this.originalSent,`
			`required this.originalWritten,`
full draft speech to text with word level feedback 2 years ago			`this.speechToText,`
code files 2 years ago			`});`

full draft speech to text with word level feedback 2 years ago			`factory PangeaRepresentation.fromJson(Map<String, dynamic> json) {`
			`return PangeaRepresentation(`
			`langCode: json[_langCodeKey],`
			`text: json[_textKey],`
			`originalSent: json[_originalSentKey] ?? false,`
			`originalWritten: json[_originalWrittenKey] ?? false,`
			`speechToText: json[_speechToTextKey] == null`
			`? null`
			`: SpeechToTextModel.fromJson(json[_speechToTextKey]),`
			`);`
			`}`
code files 2 years ago
			`static const _textKey = "txt";`
			`static const _langCodeKey = "lang";`
			`static const _originalSentKey = "snt";`
			`static const _originalWrittenKey = "wrttn";`
full draft speech to text with word level feedback 2 years ago			`static const _speechToTextKey = "stt";`
code files 2 years ago
			`Map<String, dynamic> toJson() {`
			`final data = <String, dynamic>{};`
			`data[_textKey] = text;`
			`data[_langCodeKey] = langCode;`
			`if (originalSent) data[_originalSentKey] = originalSent;`
			`if (originalWritten) data[_originalWrittenKey] = originalWritten;`
full draft speech to text with word level feedback 2 years ago			`if (speechToText != null) {`
			`data[_speechToTextKey] = speechToText!.toJson();`
			`}`
code files 2 years ago			`return data;`
			`}`
moved functions for constructing constructs out of pangea message event so they can be created without direct access to the representation event 1 year ago
update vocabUses function to save tokens in matches as GA construct uses 1 year ago			`/// Get construct uses for the message that weren't captured during language assistance.`
moved functions for constructing constructs out of pangea message event so they can be created without direct access to the representation event 1 year ago			`/// Takes a list of tokens and a choreo record, which is searched`
			`/// through for each token for its construct use type.`
			`/// Also takes either an event (typically when the Representation itself is`
			`/// available) or construct use metadata (when the event is not available,`
			`/// i.e. immediately after message send) to create the construct use.`
update vocabUses function to save tokens in matches as GA construct uses 1 year ago			`List<OneConstructUse> vocabAndMorphUses({`
moved functions for constructing constructs out of pangea message event so they can be created without direct access to the representation event 1 year ago			`required List<PangeaToken> tokens,`
			`Event? event,`
			`ConstructUseMetaData? metadata,`
			`ChoreoRecord? choreo,`
			`}) {`
			`final List<OneConstructUse> uses = [];`
Unborked locales (#1741) * feat: localized languages --------- Co-authored-by: github-actions[bot] <41898282+github-actions[bot]@users.noreply.github.com> Co-authored-by: ggurdin <ggurdin@gmail.com> Co-authored-by: ggurdin <46800240+ggurdin@users.noreply.github.com> 9 months ago			`final l2 = MatrixState.pangeaController.languageController.userL2;`
			`if (langCode.split("-")[0] != l2?.langCodeShort) return uses;`
moved functions for constructing constructs out of pangea message event so they can be created without direct access to the representation event 1 year ago
			`// missing vital info so return`
			`if (event?.roomId == null && metadata?.roomId == null) {`
			`// debugger(when: kDebugMode);`
			`return uses;`
			`}`

			`metadata ??= ConstructUseMetaData(`
			`roomId: event!.roomId!,`
			`eventId: event.eventId,`
			`timeStamp: event.originServerTs,`
			`);`

			`// for each token, record whether selected in ga, ta, or wa`
			`final tokensToSave =`
			`tokens.where((token) => token.lemma.saveVocab).toList();`
			`for (final token in tokensToSave) {`
add draft construct uses while using language assistance, added morphs to learning progress indicators 1 year ago			`uses.addAll(`
some questions, name changes, and a couple switches from grammar to morph uses 1 year ago			`_getUsesForToken(`
moved functions for constructing constructs out of pangea message event so they can be created without direct access to the representation event 1 year ago			`token,`
			`metadata,`
			`choreo: choreo,`
			`),`
			`);`
			`}`

			`return uses;`
			`}`

			`/// Returns a [OneConstructUse] for the given [token]`
			`/// If there is no [choreo], the [token] is`
			`/// considered to be a [ConstructUseTypeEnum.wa] as long as it matches the target language.`
			`/// Later on, we may want to consider putting it in some category of like 'pending'`
update vocabUses function to save tokens in matches as GA construct uses 1 year ago			`///`
			`/// For both vocab and morph constructs, we should`
			`/// 1) give wa if no assistance was used`
			`/// 2) give ga if IGC was used and`
			`/// 3) make no use if IT was used`
some questions, name changes, and a couple switches from grammar to morph uses 1 year ago			`List<OneConstructUse> _getUsesForToken(`
moved functions for constructing constructs out of pangea message event so they can be created without direct access to the representation event 1 year ago			`PangeaToken token,`
			`ConstructUseMetaData metadata, {`
			`ChoreoRecord? choreo,`
			`}) {`
add draft construct uses while using language assistance, added morphs to learning progress indicators 1 year ago			`final List<OneConstructUse> uses = [];`
moved functions for constructing constructs out of pangea message event so they can be created without direct access to the representation event 1 year ago			`final lemma = token.lemma;`
			`final content = token.text.content;`

			`if (choreo == null) {`
use target tokens instead of target constructs to get practice activi… (#1274) * use target tokens instead of target constructs to get practice activity uses * save morph construct for token parts of speech 11 months ago			`uses.add(`
			`OneConstructUse(`
feat: don't award analytics data for messages not in l2 (#1686) 9 months ago			`useType: ConstructUseTypeEnum.wa,`
use target tokens instead of target constructs to get practice activi… (#1274) * use target tokens instead of target constructs to get practice activity uses * save morph construct for token parts of speech 11 months ago			`lemma: token.pos,`
			`form: token.text.content,`
			`category: "POS",`
			`constructType: ConstructTypeEnum.morph,`
			`metadata: metadata,`
			`),`
			`);`

added 'categories' field to construct use model and started saving morph category 1 year ago			`for (final entry in token.morph.entries) {`
			`uses.add(`
			`OneConstructUse(`
feat: don't award analytics data for messages not in l2 (#1686) 9 months ago			`useType: ConstructUseTypeEnum.wa,`
added 'categories' field to construct use model and started saving morph category 1 year ago			`lemma: entry.value,`
guess grammar category when missing, saving form when available 12 months ago			`form: token.text.content,`
make construct use category a String? instead of a list, set it to POS for vocab constructs 1 year ago			`category: entry.key,`
add draft construct uses while using language assistance, added morphs to learning progress indicators 1 year ago			`constructType: ConstructTypeEnum.morph,`
			`metadata: metadata,`
			`),`
added 'categories' field to construct use model and started saving morph category 1 year ago			`);`
			`}`
filter out lemmas with saveVocab set to false 1 year ago
			`if (lemma.saveVocab) {`
			`uses.add(`
make construct use category a String? instead of a list, set it to POS for vocab constructs 1 year ago			`token.toVocabUse(`
feat: don't award analytics data for messages not in l2 (#1686) 9 months ago			`ConstructUseTypeEnum.wa,`
filter out lemmas with saveVocab set to false 1 year ago			`metadata,`
			`),`
			`);`
			`}`
add draft construct uses while using language assistance, added morphs to learning progress indicators 1 year ago			`return uses;`
moved functions for constructing constructs out of pangea message event so they can be created without direct access to the representation event 1 year ago			`}`

			`for (final step in choreo.choreoSteps) {`
			`/// if 1) accepted match 2) token is in the replacement and 3) replacement`
			`/// is in the overall step text, then token was a ga`
			`final bool isAcceptedMatch =`
			`step.acceptedOrIgnoredMatch?.status == PangeaMatchStatus.accepted;`
update vocabUses function to save tokens in matches as GA construct uses 1 year ago
			`// if the token was in an IT match, return no uses`
			`if (step.itStep != null) return [];`

			`// if this step was not accepted, continue`
			`if (!isAcceptedMatch) continue;`
moved functions for constructing constructs out of pangea message event so they can be created without direct access to the representation event 1 year ago
			`if (isAcceptedMatch &&`
			`step.acceptedOrIgnoredMatch?.match.choices != null) {`
			`final choices = step.acceptedOrIgnoredMatch!.match.choices!;`
			`final bool stepContainedToken = choices.any(`
			`(choice) =>`
			`// if this choice contains the token's content`
update vocabUses function to save tokens in matches as GA construct uses 1 year ago			`choice.value.contains(content),`
moved functions for constructing constructs out of pangea message event so they can be created without direct access to the representation event 1 year ago			`);`
			`if (stepContainedToken) {`
update vocabUses function to save tokens in matches as GA construct uses 1 year ago			`// give ga if IGC was used`
			`uses.add(`
resolved merge conflicts 1 year ago			`token.toVocabUse(`
update vocabUses function to save tokens in matches as GA construct uses 1 year ago			`ConstructUseTypeEnum.ga,`
			`metadata,`
			`),`
			`);`
use target tokens instead of target constructs to get practice activi… (#1274) * use target tokens instead of target constructs to get practice activity uses * save morph construct for token parts of speech 11 months ago
			`uses.add(`
			`OneConstructUse(`
			`useType: ConstructUseTypeEnum.ga,`
			`lemma: token.pos,`
			`form: token.text.content,`
			`category: "POS",`
			`constructType: ConstructTypeEnum.morph,`
			`metadata: metadata,`
			`),`
			`);`

update vocabUses function to save tokens in matches as GA construct uses 1 year ago			`for (final entry in token.morph.entries) {`
			`uses.add(`
			`OneConstructUse(`
			`useType: ConstructUseTypeEnum.ga,`
			`lemma: entry.value,`
guess grammar category when missing, saving form when available 12 months ago			`form: token.text.content,`
resolved merge conflicts 1 year ago			`category: entry.key,`
update vocabUses function to save tokens in matches as GA construct uses 1 year ago			`constructType: ConstructTypeEnum.morph,`
			`metadata: metadata,`
			`),`
			`);`
			`}`
			`return uses;`
moved functions for constructing constructs out of pangea message event so they can be created without direct access to the representation event 1 year ago			`}`
			`}`
			`}`
add draft construct uses while using language assistance, added morphs to learning progress indicators 1 year ago
use target tokens instead of target constructs to get practice activi… (#1274) * use target tokens instead of target constructs to get practice activity uses * save morph construct for token parts of speech 11 months ago			`uses.add(`
			`OneConstructUse(`
			`useType: ConstructUseTypeEnum.wa,`
			`lemma: token.pos,`
			`form: token.text.content,`
			`category: "POS",`
			`constructType: ConstructTypeEnum.morph,`
			`metadata: metadata,`
			`),`
			`);`

update vocabUses function to save tokens in matches as GA construct uses 1 year ago			`// the token wasn't found in any IT or IGC step, so it was wa`
added 'categories' field to construct use model and started saving morph category 1 year ago			`for (final entry in token.morph.entries) {`
			`uses.add(`
			`OneConstructUse(`
add draft construct uses while using language assistance, added morphs to learning progress indicators 1 year ago			`useType: ConstructUseTypeEnum.wa,`
added 'categories' field to construct use model and started saving morph category 1 year ago			`lemma: entry.value,`
guess grammar category when missing, saving form when available 12 months ago			`form: token.text.content,`
make construct use category a String? instead of a list, set it to POS for vocab constructs 1 year ago			`category: entry.key,`
add draft construct uses while using language assistance, added morphs to learning progress indicators 1 year ago			`constructType: ConstructTypeEnum.morph,`
			`metadata: metadata,`
			`),`
added 'categories' field to construct use model and started saving morph category 1 year ago			`);`
			`}`
filter out lemmas with saveVocab set to false 1 year ago			`if (lemma.saveVocab) {`
			`uses.add(`
make construct use category a String? instead of a list, set it to POS for vocab constructs 1 year ago			`token.toVocabUse(`
filter out lemmas with saveVocab set to false 1 year ago			`ConstructUseTypeEnum.wa,`
			`metadata,`
			`),`
			`);`
			`}`
add draft construct uses while using language assistance, added morphs to learning progress indicators 1 year ago			`return uses;`
moved functions for constructing constructs out of pangea message event so they can be created without direct access to the representation event 1 year ago			`}`
code files 2 years ago			`}`