From f0260aa94ca54775274a34e5175fa61a1ecfece3 Mon Sep 17 00:00:00 2001 From: =?UTF-8?q?Jo=C3=A3o=20Fernandes?= Date: Mon, 20 May 2024 03:14:04 -0300 Subject: [PATCH] [gleam] complete protein-translation --- gleam/protein-translation/.gitignore | 4 + gleam/protein-translation/HELP.md | 32 +++ gleam/protein-translation/README.md | 60 ++++++ gleam/protein-translation/gleam.toml | 12 ++ gleam/protein-translation/manifest.toml | 27 +++ .../src/protein_translation.gleam | 19 ++ .../test/protein_translation_test.gleam | 187 ++++++++++++++++++ 7 files changed, 341 insertions(+) create mode 100644 gleam/protein-translation/.gitignore create mode 100644 gleam/protein-translation/HELP.md create mode 100644 gleam/protein-translation/README.md create mode 100644 gleam/protein-translation/gleam.toml create mode 100644 gleam/protein-translation/manifest.toml create mode 100644 gleam/protein-translation/src/protein_translation.gleam create mode 100644 gleam/protein-translation/test/protein_translation_test.gleam diff --git a/gleam/protein-translation/.gitignore b/gleam/protein-translation/.gitignore new file mode 100644 index 0000000..170cca9 --- /dev/null +++ b/gleam/protein-translation/.gitignore @@ -0,0 +1,4 @@ +*.beam +*.ez +build +erl_crash.dump diff --git a/gleam/protein-translation/HELP.md b/gleam/protein-translation/HELP.md new file mode 100644 index 0000000..33f3584 --- /dev/null +++ b/gleam/protein-translation/HELP.md @@ -0,0 +1,32 @@ +# Help + +## Running the tests + +To run the tests, run the command `gleam test` from within the exercise directory. + +## Submitting your solution + +You can submit your solution using the `exercism submit src/protein_translation.gleam` command. +This command will upload your solution to the Exercism website and print the solution page's URL. + +It's possible to submit an incomplete solution which allows you to: + +- See how others have completed the exercise +- Request help from a mentor + +## Need to get help? + +If you'd like help solving the exercise, check the following pages: + +- The [Gleam track's documentation](https://exercism.org/docs/tracks/gleam) +- The [Gleam track's programming category on the forum](https://forum.exercism.org/c/programming/gleam) +- [Exercism's programming category on the forum](https://forum.exercism.org/c/programming/5) +- The [Frequently Asked Questions](https://exercism.org/docs/using/faqs) + +Should those resources not suffice, you could submit your (incomplete) solution to request mentoring. + +To get help if you're having trouble, you can use one of the following resources: + +- [gleam.run](https://gleam.run/documentation/) is the gleam official documentation. +- [Discord](https://discord.gg/Fm8Pwmy) is the discord channel. +- [StackOverflow](https://stackoverflow.com/questions/tagged/gleam) can be used to search for your problem and see if it has been answered already. You can also ask and answer questions. \ No newline at end of file diff --git a/gleam/protein-translation/README.md b/gleam/protein-translation/README.md new file mode 100644 index 0000000..2e4dfec --- /dev/null +++ b/gleam/protein-translation/README.md @@ -0,0 +1,60 @@ +# Protein Translation + +Welcome to Protein Translation on Exercism's Gleam Track. +If you need help running the tests or submitting your code, check out `HELP.md`. + +## Instructions + +Translate RNA sequences into proteins. + +RNA can be broken into three nucleotide sequences called codons, and then translated to a polypeptide like so: + +RNA: `"AUGUUUUCU"` => translates to + +Codons: `"AUG", "UUU", "UCU"` +=> which become a polypeptide with the following sequence => + +Protein: `"Methionine", "Phenylalanine", "Serine"` + +There are 64 codons which in turn correspond to 20 amino acids; however, all of the codon sequences and resulting amino acids are not important in this exercise. +If it works for one codon, the program should work for all of them. +However, feel free to expand the list in the test suite to include them all. + +There are also three terminating codons (also known as 'STOP' codons); if any of these codons are encountered (by the ribosome), all translation ends and the protein is terminated. + +All subsequent codons after are ignored, like this: + +RNA: `"AUGUUUUCUUAAAUG"` => + +Codons: `"AUG", "UUU", "UCU", "UAA", "AUG"` => + +Protein: `"Methionine", "Phenylalanine", "Serine"` + +Note the stop codon `"UAA"` terminates the translation and the final methionine is not translated into the protein sequence. + +Below are the codons and resulting Amino Acids needed for the exercise. + +| Codon | Protein | +| :----------------- | :------------ | +| AUG | Methionine | +| UUU, UUC | Phenylalanine | +| UUA, UUG | Leucine | +| UCU, UCC, UCA, UCG | Serine | +| UAU, UAC | Tyrosine | +| UGU, UGC | Cysteine | +| UGG | Tryptophan | +| UAA, UAG, UGA | STOP | + +Learn more about [protein translation on Wikipedia][protein-translation]. + +[protein-translation]: https://en.wikipedia.org/wiki/Translation_(biology) + +## Source + +### Created by + +- @lpil + +### Based on + +Tyler Long \ No newline at end of file diff --git a/gleam/protein-translation/gleam.toml b/gleam/protein-translation/gleam.toml new file mode 100644 index 0000000..0389d20 --- /dev/null +++ b/gleam/protein-translation/gleam.toml @@ -0,0 +1,12 @@ +name = "protein_translation" +version = "0.1.0" + +[dependencies] +gleam_bitwise = "~> 1.2" +gleam_otp = "~> 0.7 or ~> 1.0" +gleam_stdlib = "~> 0.32 or ~> 1.0" +simplifile = "~> 1.0" +gleam_erlang = ">= 0.25.0 and < 1.0.0" + +[dev-dependencies] +exercism_test_runner = "~> 1.4" diff --git a/gleam/protein-translation/manifest.toml b/gleam/protein-translation/manifest.toml new file mode 100644 index 0000000..072155d --- /dev/null +++ b/gleam/protein-translation/manifest.toml @@ -0,0 +1,27 @@ +# This file was generated by Gleam +# You typically do not need to edit this file + +packages = [ + { name = "argv", version = "1.0.1", build_tools = ["gleam"], requirements = [], otp_app = "argv", source = "hex", outer_checksum = "A6E9009E50BBE863EB37D963E4315398D41A3D87D0075480FC244125808F964A" }, + { name = "exercism_test_runner", version = "1.7.0", build_tools = ["gleam"], requirements = ["argv", "gap", "glance", "gleam_community_ansi", "gleam_erlang", "gleam_json", "gleam_stdlib", "simplifile"], otp_app = "exercism_test_runner", source = "hex", outer_checksum = "2FC1BADB19BEC2AE77BFD2D3A606A014C85412A7B874CAFC4BA8CF04B0B257CD" }, + { name = "gap", version = "1.1.0", build_tools = ["gleam"], requirements = ["gleam_community_ansi", "gleam_stdlib"], otp_app = "gap", source = "hex", outer_checksum = "2EE1B0A17E85CF73A0C1D29DA315A2699117A8F549C8E8D89FA8261BE41EDEB1" }, + { name = "glance", version = "0.8.2", build_tools = ["gleam"], requirements = ["gleam_stdlib", "glexer"], otp_app = "glance", source = "hex", outer_checksum = "ACF09457E8B564AD7A0D823DAFDD326F58263C01ACB0D432A9BEFDEDD1DA8E73" }, + { name = "gleam_bitwise", version = "1.3.1", build_tools = ["gleam"], requirements = [], otp_app = "gleam_bitwise", source = "hex", outer_checksum = "B36E1D3188D7F594C7FD4F43D0D2CE17561DE896202017548578B16FE1FE9EFC" }, + { name = "gleam_community_ansi", version = "1.4.0", build_tools = ["gleam"], requirements = ["gleam_community_colour", "gleam_stdlib"], otp_app = "gleam_community_ansi", source = "hex", outer_checksum = "FE79E08BF97009729259B6357EC058315B6FBB916FAD1C2FF9355115FEB0D3A4" }, + { name = "gleam_community_colour", version = "1.3.0", build_tools = ["gleam"], requirements = ["gleam_stdlib"], otp_app = "gleam_community_colour", source = "hex", outer_checksum = "A49A5E3AE8B637A5ACBA80ECB9B1AFE89FD3D5351FF6410A42B84F666D40D7D5" }, + { name = "gleam_erlang", version = "0.25.0", build_tools = ["gleam"], requirements = ["gleam_stdlib"], otp_app = "gleam_erlang", source = "hex", outer_checksum = "054D571A7092D2A9727B3E5D183B7507DAB0DA41556EC9133606F09C15497373" }, + { name = "gleam_json", version = "1.0.0", build_tools = ["gleam"], requirements = ["gleam_stdlib", "thoas"], otp_app = "gleam_json", source = "hex", outer_checksum = "8B197DD5D578EA6AC2C0D4BDC634C71A5BCA8E7DB5F47091C263ECB411A60DF3" }, + { name = "gleam_otp", version = "0.10.0", build_tools = ["gleam"], requirements = ["gleam_erlang", "gleam_stdlib"], otp_app = "gleam_otp", source = "hex", outer_checksum = "0B04FE915ACECE539B317F9652CAADBBC0F000184D586AAAF2D94C100945D72B" }, + { name = "gleam_stdlib", version = "0.36.0", build_tools = ["gleam"], requirements = [], otp_app = "gleam_stdlib", source = "hex", outer_checksum = "C0D14D807FEC6F8A08A7C9EF8DFDE6AE5C10E40E21325B2B29365965D82EB3D4" }, + { name = "glexer", version = "0.7.0", build_tools = ["gleam"], requirements = ["gleam_stdlib"], otp_app = "glexer", source = "hex", outer_checksum = "4484942A465482A0A100936E1E5F12314DB4B5AC0D87575A7B9E9062090B96BE" }, + { name = "simplifile", version = "1.5.0", build_tools = ["gleam"], requirements = ["gleam_stdlib"], otp_app = "simplifile", source = "hex", outer_checksum = "EB9AA8E65E5C1E3E0FDCFC81BC363FD433CB122D7D062750FFDF24DE4AC40116" }, + { name = "thoas", version = "0.4.1", build_tools = ["rebar3"], requirements = [], otp_app = "thoas", source = "hex", outer_checksum = "4918D50026C073C4AB1388437132C77A6F6F7C8AC43C60C13758CC0ADCE2134E" }, +] + +[requirements] +exercism_test_runner = { version = "~> 1.4" } +gleam_bitwise = { version = "~> 1.2" } +gleam_erlang = { version = ">= 0.25.0 and < 1.0.0"} +gleam_otp = { version = "~> 0.7 or ~> 1.0" } +gleam_stdlib = { version = "~> 0.32 or ~> 1.0" } +simplifile = { version = "~> 1.0" } diff --git a/gleam/protein-translation/src/protein_translation.gleam b/gleam/protein-translation/src/protein_translation.gleam new file mode 100644 index 0000000..a0fcca3 --- /dev/null +++ b/gleam/protein-translation/src/protein_translation.gleam @@ -0,0 +1,19 @@ +import gleam/list + +pub fn proteins(rna: String) -> Result(List(String), Nil) { + translate(rna, []) +} + +fn translate(rna: String, acc: List(String)) -> Result(List(String), Nil) { + case rna { + "AUG" <> rest -> translate(rest, ["Methionine", ..acc]) + "UUU" <> rest | "UUC" <> rest -> translate(rest, ["Phenylalanine", ..acc]) + "UUA" <> rest | "UUG" <> rest -> translate(rest, ["Leucine", ..acc]) + "UCU" <> rest | "UCC" <> rest | "UCA" <> rest | "UCG" <> rest -> translate(rest, ["Serine", ..acc]) + "UAU" <> rest | "UAC" <> rest -> translate(rest, ["Tyrosine", ..acc]) + "UGU" <> rest | "UGC" <> rest -> translate(rest, ["Cysteine", ..acc]) + "UGG" <> rest -> translate(rest, ["Tryptophan", ..acc]) + "UAA" <> _ | "UAG" <> _ | "UGA" <> _ | "" -> Ok(list.reverse(acc)) + _ -> Error(Nil) + } +} diff --git a/gleam/protein-translation/test/protein_translation_test.gleam b/gleam/protein-translation/test/protein_translation_test.gleam new file mode 100644 index 0000000..e7b3054 --- /dev/null +++ b/gleam/protein-translation/test/protein_translation_test.gleam @@ -0,0 +1,187 @@ +import exercism/should +import exercism/test_runner +import protein_translation + +pub fn main() { + test_runner.main() +} + +pub fn empty_rna_sequence_results_in_no_proteins_test() { + "" + |> protein_translation.proteins + |> should.equal(Ok([])) +} + +pub fn methione_rna_sequence_test() { + "AUG" + |> protein_translation.proteins + |> should.equal(Ok(["Methionine"])) +} + +pub fn phenylalanine_rna_sequence_1_test() { + "UUU" + |> protein_translation.proteins + |> should.equal(Ok(["Phenylalanine"])) +} + +pub fn phenylalanine_rna_sequence_2_test() { + "UUC" + |> protein_translation.proteins + |> should.equal(Ok(["Phenylalanine"])) +} + +pub fn leucine_rna_sequence_1_test() { + "UUA" + |> protein_translation.proteins + |> should.equal(Ok(["Leucine"])) +} + +pub fn leucine_rna_sequence_2_test() { + "UUG" + |> protein_translation.proteins + |> should.equal(Ok(["Leucine"])) +} + +pub fn serine_rna_sequence_1_test() { + "UCU" + |> protein_translation.proteins + |> should.equal(Ok(["Serine"])) +} + +pub fn serine_rna_sequence_2_test() { + "UCC" + |> protein_translation.proteins + |> should.equal(Ok(["Serine"])) +} + +pub fn serine_rna_sequence_3_test() { + "UCA" + |> protein_translation.proteins + |> should.equal(Ok(["Serine"])) +} + +pub fn serine_rna_sequence_4_test() { + "UCG" + |> protein_translation.proteins + |> should.equal(Ok(["Serine"])) +} + +pub fn tyrosine_rna_sequence_1_test() { + "UAU" + |> protein_translation.proteins + |> should.equal(Ok(["Tyrosine"])) +} + +pub fn tyrosine_rna_sequence_2_test() { + "UAC" + |> protein_translation.proteins + |> should.equal(Ok(["Tyrosine"])) +} + +pub fn cysteine_rna_sequence_1_test() { + "UGU" + |> protein_translation.proteins + |> should.equal(Ok(["Cysteine"])) +} + +pub fn cysteine_rna_sequence_2_test() { + "UGC" + |> protein_translation.proteins + |> should.equal(Ok(["Cysteine"])) +} + +pub fn tryptophan_rna_sequence_test() { + "UGG" + |> protein_translation.proteins + |> should.equal(Ok(["Tryptophan"])) +} + +pub fn stop_codon_rna_sequence_1_test() { + "UAA" + |> protein_translation.proteins + |> should.equal(Ok([])) +} + +pub fn stop_codon_rna_sequence_2_test() { + "UAG" + |> protein_translation.proteins + |> should.equal(Ok([])) +} + +pub fn stop_codon_rna_sequence_3_test() { + "UGA" + |> protein_translation.proteins + |> should.equal(Ok([])) +} + +pub fn sequence_of_two_protein_codons_translates_into_proteins_test() { + "UUUUUU" + |> protein_translation.proteins + |> should.equal(Ok(["Phenylalanine", "Phenylalanine"])) +} + +pub fn sequence_of_two_different_protein_codons_translates_into_proteins_test() { + "UUAUUG" + |> protein_translation.proteins + |> should.equal(Ok(["Leucine", "Leucine"])) +} + +pub fn translate_rna_strand_into_correct_protein_list_test() { + "AUGUUUUGG" + |> protein_translation.proteins + |> should.equal(Ok(["Methionine", "Phenylalanine", "Tryptophan"])) +} + +pub fn translation_stops_if_stop_codon_at_beginning_of_sequence_test() { + "UAGUGG" + |> protein_translation.proteins + |> should.equal(Ok([])) +} + +pub fn translation_stops_if_stop_codon_at_end_of_two_codon_sequence_test() { + "UGGUAG" + |> protein_translation.proteins + |> should.equal(Ok(["Tryptophan"])) +} + +pub fn translation_stops_if_stop_codon_at_end_of_three_codon_sequence_test() { + "AUGUUUUAA" + |> protein_translation.proteins + |> should.equal(Ok(["Methionine", "Phenylalanine"])) +} + +pub fn translation_stops_if_stop_codon_in_middle_of_three_codon_sequence_test() { + "UGGUAGUGG" + |> protein_translation.proteins + |> should.equal(Ok(["Tryptophan"])) +} + +pub fn non_existing_codon_cant_translate_test() { + "AAA" + |> protein_translation.proteins + |> should.equal(Error(Nil)) +} + +pub fn unknown_amino_acids_not_part_of_a_codon_cant_translate_test() { + "XYZ" + |> protein_translation.proteins + |> should.equal(Error(Nil)) +} + +pub fn incomplete_rna_sequence_cant_translate_test() { + "AUGU" + |> protein_translation.proteins + |> should.equal(Error(Nil)) +} + +pub fn translation_stops_if_stop_codon_in_middle_of_six_codon_sequence_test() { + "UGGUGUUAUUAAUGGUUU" + |> protein_translation.proteins + |> should.equal(Ok(["Tryptophan", "Cysteine", "Tyrosine"])) +} + +pub fn incomplete_rna_sequence_can_translate_if_valid_until_a_stop_codon_test() { + "UUCUUCUAAUGGU" + |> protein_translation.proteins + |> should.equal(Ok(["Phenylalanine", "Phenylalanine"])) +}