Minimum Genetic Mutation

                                            
class Solution {
public:
    /**
     * Returns the minimum number of single-character mutations needed to turn
     * startGene into endGene, or -1 when endGene cannot be reached.
     *
     * Every gene produced along the way (including endGene) must be present in
     * bank; startGene itself does not have to be. The search is a level-by-level
     * breadth-first search, so the first time endGene is dequeued the level
     * counter holds the shortest mutation count.
     *
     * @param startGene gene the search starts from
     * @param endGene   gene to reach
     * @param bank      list of genes that are valid mutation results
     * @return minimum number of mutations, 0 if the genes are already equal,
     *         or -1 if endGene is unreachable
     */
    int minMutation(string startGene, string endGene, vector<string>& bank) {
        // No mutation is required when the genes already match, whether or
        // not endGene is listed in the bank.
        if (startGene == endGene) {
            return 0;
        }

        unordered_set<string> geneBank(bank.begin(), bank.end());
        if (geneBank.find(endGene) == geneBank.end()) {
            return -1;
        }
        // The bank doubles as the "not yet visited" set; the start gene is
        // visited from the outset.
        geneBank.erase(startGene);

        const string bases = "ACGT";
        queue<string> q;
        q.push(startGene);
        int mutations = 0;

        while (!q.empty()) {
            // Process exactly one BFS level per outer iteration.
            size_t levelSize = q.size();
            for (size_t i = 0; i < levelSize; i++) {
                string currentGene = q.front();
                q.pop();

                if (currentGene == endGene) {
                    return mutations;
                }

                // Use the gene's real length instead of assuming 8 characters.
                for (size_t j = 0; j < currentGene.size(); j++) {
                    const char originalChar = currentGene[j];
                    for (char base : bases) {
                        if (base == originalChar) {
                            continue;
                        }
                        currentGene[j] = base;
                        auto hit = geneBank.find(currentGene);
                        if (hit != geneBank.end()) {
                            q.push(currentGene);
                            // Erase on enqueue so no gene is queued twice.
                            geneBank.erase(hit);
                        }
                    }
                    currentGene[j] = originalChar;
                }
            }
            mutations++;
        }

        return -1;
    }
};

                                            
class Solution {
    /**
     * Computes the minimum number of single-character mutations needed to
     * turn {@code startGene} into {@code endGene}.
     *
     * Every gene produced by a mutation (including {@code endGene}) must be
     * contained in {@code bank}. The search is a level-by-level breadth-first
     * search, so the level at which {@code endGene} is dequeued is the
     * shortest mutation count.
     *
     * @param startGene gene the search starts from
     * @param endGene   gene to reach
     * @param bank      genes that are valid mutation results
     * @return the minimum number of mutations, 0 when the genes are already
     *         equal, or -1 when {@code endGene} cannot be reached
     */
    public int minMutation(String startGene, String endGene, String[] bank) {
        // Identical genes need no mutation, even if endGene is not in the bank.
        if (startGene.equals(endGene)) {
            return 0;
        }

        Set<String> bankSet = new HashSet<>(Arrays.asList(bank));
        if (!bankSet.contains(endGene)) {
            return -1;
        }

        char[] choices = {'A', 'C', 'G', 'T'};

        Queue<String> queue = new LinkedList<>();
        Set<String> visited = new HashSet<>();
        queue.offer(startGene);
        visited.add(startGene);

        int mutations = 0;
        while (!queue.isEmpty()) {
            // Drain exactly one BFS level per outer iteration.
            int levelSize = queue.size();
            for (int i = 0; i < levelSize; i++) {
                String current = queue.poll();
                if (current.equals(endGene)) {
                    return mutations;
                }

                char[] currentChars = current.toCharArray();
                for (int j = 0; j < currentChars.length; j++) {
                    char originalChar = currentChars[j];
                    for (char c : choices) {
                        if (c == originalChar) {
                            // Not a mutation; skip building an identical string.
                            continue;
                        }
                        currentChars[j] = c;
                        String newGene = new String(currentChars);
                        // Set.add returns false when the gene was already seen.
                        if (bankSet.contains(newGene) && visited.add(newGene)) {
                            queue.offer(newGene);
                        }
                    }
                    currentChars[j] = originalChar;
                }
            }
            mutations++;
        }

        return -1;
    }
}

                                            
class Solution(object):
    def minMutation(self, startGene, endGene, bank):
        """Return the minimum number of mutations from startGene to endGene.

        A mutation changes a single character to one of 'A', 'C', 'G', 'T',
        and every gene produced by a mutation (including endGene) must be in
        bank. Uses breadth-first search, so the first time endGene is
        dequeued its recorded count is the shortest one.

        :param startGene: gene string the search starts from
        :param endGene: gene string to reach
        :param bank: iterable of gene strings that are valid mutation results
        :return: minimum number of mutations, 0 if the genes are already
            equal, or -1 if endGene cannot be reached
        """
        from collections import deque

        # Identical genes need no mutation, even if endGene is not in bank.
        if startGene == endGene:
            return 0

        # Set membership is O(1); the bank is probed once per candidate.
        bank_set = set(bank)
        if endGene not in bank_set:
            return -1

        queue = deque([(startGene, 0)])
        # Seed with the start gene so it is never enqueued a second time.
        visited = {startGene}

        while queue:
            gene, mutations = queue.popleft()

            if gene == endGene:
                return mutations

            for i in range(len(gene)):
                for nucleotide in 'ACGT':
                    if nucleotide == gene[i]:
                        continue  # unchanged character is not a mutation
                    newGene = gene[:i] + nucleotide + gene[i + 1:]

                    if newGene in bank_set and newGene not in visited:
                        visited.add(newGene)
                        queue.append((newGene, mutations + 1))

        return -1

                                            
public class Solution {
    /// <summary>
    /// Finds the minimum number of single-character mutations that turn
    /// <paramref name="startGene"/> into <paramref name="endGene"/>, where every
    /// mutated gene must be contained in <paramref name="bank"/>.
    /// </summary>
    /// <param name="startGene">Gene the search starts from.</param>
    /// <param name="endGene">Gene to reach.</param>
    /// <param name="bank">Genes that are valid mutation results.</param>
    /// <returns>
    /// The minimum mutation count, 0 when both genes are equal, or -1 when
    /// <paramref name="endGene"/> is not in the bank or cannot be reached.
    /// </returns>
    public int MinMutation(string startGene, string endGene, string[] bank) {
        if (startGene == endGene) {
            return 0;
        }

        var allowed = new HashSet<string>(bank);
        if (!allowed.Contains(endGene)) {
            return -1;
        }

        const string nucleotides = "ACGT";

        var seen = new HashSet<string> { startGene };
        var frontier = new Queue<string>();
        frontier.Enqueue(startGene);

        // Each pass of the outer loop drains one breadth-first level; depth is
        // the number of mutations applied to reach the genes of that level.
        for (int depth = 0; frontier.Count > 0; depth++) {
            for (int remaining = frontier.Count; remaining > 0; remaining--) {
                string gene = frontier.Dequeue();
                if (gene == endGene) {
                    return depth;
                }

                char[] buffer = gene.ToCharArray();
                for (int pos = 0; pos < buffer.Length; pos++) {
                    char saved = buffer[pos];

                    foreach (char nucleotide in nucleotides) {
                        buffer[pos] = nucleotide;
                        string candidate = new string(buffer);

                        // HashSet.Add returns false for genes already seen.
                        if (allowed.Contains(candidate) && seen.Add(candidate)) {
                            frontier.Enqueue(candidate);
                        }
                    }

                    // Restore the position before mutating the next one.
                    buffer[pos] = saved;
                }
            }
        }

        return -1;
    }
}

                                            
/**
 * Breadth-first search for the fewest single-character mutations that turn
 * startGene into endGene, where every mutated gene must appear in bank.
 *
 * @param {string} startGene gene the search starts from
 * @param {string} endGene gene to reach
 * @param {string[]} bank genes that are valid mutation results
 * @return {number} minimum mutation count, 0 when the genes are equal,
 *                  or -1 when endGene cannot be reached
 */
var minMutation = function(startGene, endGene, bank) {
    if (startGene === endGene) {
        return 0;
    }

    // Genes still available to step onto; a gene is removed once enqueued.
    const unvisited = new Set(bank);
    const nucleotides = ['A', 'C', 'G', 'T'];

    // Process the search one level at a time; depth is the mutation count
    // of every gene in the current frontier.
    let frontier = [startGene];
    for (let depth = 0; frontier.length > 0; depth++) {
        const nextFrontier = [];

        for (const current of frontier) {
            if (current === endGene) {
                return depth;
            }

            for (let pos = 0; pos < current.length; pos++) {
                const head = current.slice(0, pos);
                const tail = current.slice(pos + 1);

                for (const nucleotide of nucleotides) {
                    if (nucleotide === current[pos]) {
                        continue;
                    }

                    const candidate = head + nucleotide + tail;
                    // Set.prototype.delete returns true only if it was present.
                    if (unvisited.delete(candidate)) {
                        nextFrontier.push(candidate);
                    }
                }
            }
        }

        frontier = nextFrontier;
    }

    return -1;
};

                                            
class Solution {
    /**
     * Breadth-first search for the fewest single-character mutations that
     * turn $startGene into $endGene, stepping only onto genes in $bank.
     *
     * @param String $startGene gene the search starts from
     * @param String $endGene gene to reach
     * @param String[] $bank genes that are valid mutation results
     * @return Integer minimum mutation count, or -1 when $endGene is unreachable
     */
    function minMutation($startGene, $endGene, $bank) {
        // Keys are the genes not yet enqueued; a key is dropped on enqueue.
        $unvisited = array_flip($bank);
        $nucleotides = ['A', 'C', 'G', 'T'];

        // $pending only grows; $head walks it in insertion (FIFO) order.
        $pending = [[$startGene, 0]];
        for ($head = 0; $head < count($pending); $head++) {
            list($current, $depth) = $pending[$head];

            if ($current == $endGene) {
                return $depth;
            }

            $length = strlen($current);
            for ($pos = 0; $pos < $length; $pos++) {
                foreach ($nucleotides as $nucleotide) {
                    if ($current[$pos] == $nucleotide) {
                        continue;
                    }

                    $candidate = substr_replace($current, $nucleotide, $pos, 1);
                    if (!isset($unvisited[$candidate])) {
                        continue;
                    }

                    unset($unvisited[$candidate]);
                    $pending[] = [$candidate, $depth + 1];
                }
            }
        }

        return -1;
    }
}

                                            
class Solution {
    /// Returns the minimum number of single-character mutations needed to turn
    /// `startGene` into `endGene`, or -1 when `endGene` cannot be reached.
    ///
    /// Every gene produced by a mutation (including `endGene`) must be in
    /// `bank`. The search expands one breadth-first level at a time, so the
    /// level at which `endGene` is first discovered is the shortest count.
    ///
    /// - Parameters:
    ///   - startGene: gene the search starts from
    ///   - endGene: gene to reach
    ///   - bank: genes that are valid mutation results
    /// - Returns: minimum mutation count, 0 when the genes are already equal,
    ///   or -1 when `endGene` is unreachable
    func minMutation(_ startGene: String, _ endGene: String, _ bank: [String]) -> Int {
        // Identical genes need no mutation, even if endGene is not in the bank.
        if startGene == endGene {
            return 0
        }
        guard bank.contains(endGene) else {
            return -1
        }

        // Seed with the start gene so it is never expanded a second time.
        var visited: Set<String> = [startGene]
        var frontier = [startGene]
        var mutations = 0

        while !frontier.isEmpty {
            mutations += 1
            var nextFrontier = [String]()

            for gene in frontier {
                for candidate in bank {
                    if visited.contains(candidate) || !isOneMutationApart(gene, candidate) {
                        continue
                    }
                    // First discovery in BFS order is the shortest path.
                    if candidate == endGene {
                        return mutations
                    }
                    visited.insert(candidate)
                    nextFrontier.append(candidate)
                }
            }

            frontier = nextFrontier
        }

        return -1
    }

    /// Returns true when the two genes have the same length and differ in
    /// exactly one character position.
    func isOneMutationApart(_ gene1: String, _ gene2: String) -> Bool {
        // Genes of different lengths cannot be one substitution apart.
        guard gene1.count == gene2.count else {
            return false
        }

        var differences = 0
        // zip walks both strings once instead of re-indexing from the start.
        for (left, right) in zip(gene1, gene2) where left != right {
            differences += 1
            if differences > 1 {
                return false
            }
        }
        return differences == 1
    }
}

To solve this coding challenge, we need to develop a method that will navigate through the possible mutations of a gene string from the `startGene` to the `endGene`. The gene string must evolve one mutation at a time, with each step being a valid gene from the provided gene bank.

Explanation

Initialization and Input Checks: We'll verify whether the `endGene` exists within the `bank`. If not, it's impossible to reach the `endGene` from the `startGene` as per the problem's restrictions, and we'll return `-1`.
Breadth-First Search (BFS): This search technique is ideal here because it explores all possible mutations at each level before moving on to mutations from the next level. This ensures that we find the shortest possible path from `startGene` to `endGene`. We'll use a queue to implement BFS.
Queue Operation :

The queue will store tuples containing the current gene string and the number of mutations taken to reach it.
We initiate the queue with the `startGene` and a mutation count of `0`.

Visited Set : To avoid revisiting gene strings and potential infinite loops, we'll maintain a set of visited gene strings.
Processing Each Gene :

For each gene string and mutation count in the queue, we will check if the current gene matches the `endGene`.
If it matches, return the current mutation count as it represents the minimum mutations needed.

Generating Mutations :

For each character in the gene string, we will attempt to mutate it to one of the other valid characters ('A', 'C', 'G', 'T').
For each mutation, we will check if the new gene string is in the bank and hasn't been visited.
If valid, add the new gene string to the queue with an incremented mutation count and mark it as visited.

End Condition: If the queue is exhausted and no path to `endGene` is found, return `-1`.

Detailed Steps in Pseudocode

1. Initialize an empty set `visited` to keep track of visited gene strings.
2. Initialize the queue with the tuple `(startGene, 0)` and add `startGene` to visited.
3. Check if `endGene` is in the `bank`. If not, return `-1`.
4. While the queue is not empty, do the following:
   - Dequeue the front element (currentGene, currentMutations).
   - If `currentGene == endGene`, return `currentMutations`.
   - For each character position in `currentGene`:
     - Try mutating to each possible nucleotide ('A', 'C', 'G', 'T').
     - If the resulting new gene string is valid (in `bank` and not visited):
       - Mark it as visited.
       - Enqueue the new gene string with the incremented mutation count.
5. If the queue is exhausted without finding `endGene`, return `-1`.

Pseudocode

                                            
# Pseudocode sketch of the breadth-first search. It is not directly runnable:
# the `return` statements assume an enclosing function that receives
# startGene, endGene and bank.

# Check for endGene in bank
if endGene not in bank:
    # If endGene is not in bank, return -1
    return -1

# Initialize variables
# Queue to store current gene string and its mutation count
queue = [(startGene, 0)]
# Set to store visited gene strings
visited = set()
# Add startGene to visited
visited.add(startGene)

# BFS loop while queue is not empty
while queue is not empty:
    # Dequeue the front element (current gene string and mutation count)
    # Taking from index 0 processes genes in the order they were enqueued.
    currentGene, currentMutations = queue.pop(0)
    
    # Check if current gene matches the end gene
    if currentGene == endGene:
        # If matched, return the current number of mutations
        return currentMutations
    
    # Try mutating every character of the current gene
    for i in range(len(currentGene)):
        # For every nucleotide, attempt mutation
        for nucleotide in ['A', 'C', 'G', 'T']:
            # Create a new gene string by changing one nucleotide
            newGene = currentGene[:i] + nucleotide + currentGene[i+1:]
            
            # Check if new gene string is valid and not visited
            if newGene in bank and newGene not in visited:
                # Mark new gene as visited
                visited.add(newGene)
                # Enqueue the new gene string with incremented mutation count
                queue.append((newGene, currentMutations + 1))

# If the end gene is not reached, return -1
return -1

By using the described BFS approach, we ensure that we investigate all possible mutations leading us to the minimum number of mutations needed. This solution is efficient given the constraints and guarantees that the shortest path to the target gene is found.