diff --git a/segmentation/__init__.py b/segmentation/__init__.py
new file mode 100644
index 0000000..ce1ea7c
--- /dev/null
+++ b/segmentation/__init__.py
@@ -0,0 +1,5 @@
+from .factory import get_segmenter
+
+__all__ = [
+    "get_segmenter",
+]
\ No newline at end of file
diff --git a/segmentation/base/__init__.py b/segmentation/base/__init__.py
new file mode 100644
index 0000000..bdbbd2b
--- /dev/null
+++ b/segmentation/base/__init__.py
@@ -0,0 +1,7 @@
+from .gazette_segment import GazetteSegment
+from .association_segmenter import AssociationSegmenter
+
+__all__ = [
+    "GazetteSegment",
+    "AssociationSegmenter",
+]
\ No newline at end of file
diff --git a/segmentation/base/association_segmenter.py b/segmentation/base/association_segmenter.py
new file mode 100644
index 0000000..cd1e99e
--- /dev/null
+++ b/segmentation/base/association_segmenter.py
@@ -0,0 +1,27 @@
+from typing import Union, Dict, List
+from segmentation.base import GazetteSegment
+
+
+class AssociationSegmenter:
+    def __init__(self, association_gazette: str):
+        self.association_gazette = association_gazette
+
+    def get_gazette_segments(self, *args, **kwargs) -> List[Union[GazetteSegment, Dict]]:
+        """
+        Returns a list of GazetteSegment
+        """
+        raise NotImplementedError
+
+    def split_text_by_territory(self, *args, **kwargs) -> Union[Dict[str, str], List[str]]:
+        """
+        Segment a association text by territory
+        and returns a list of text segments
+        """
+        raise NotImplementedError
+
+    def build_segment(self, *args, **kwargs) -> GazetteSegment:
+        """
+        Returns a GazetteSegment
+        """
+        raise NotImplementedError
+
diff --git a/segmentation/base/gazette_segment.py b/segmentation/base/gazette_segment.py
new file mode 100644
index 0000000..9343ced
--- /dev/null
+++ b/segmentation/base/gazette_segment.py
@@ -0,0 +1,26 @@
+from datetime import date, datetime
+from dataclasses import dataclass
+
+
+@dataclass
+class GazetteSegment:
+    """
+    Dataclass to represent a gazette segment of a association
+    related to a city
+    """
+    territory_name: str
+    source_text: str
+    date: date
+    edition_number: str
+    is_extra_edition: bool
+    power: str
+    file_checksum: str
+    scraped_at: datetime
+    created_at: datetime
+    processed: bool
+    file_path: str
+    file_url: str
+    state_code: str
+    territory_id: str
+    file_raw_txt: str
+    url: str
\ No newline at end of file
diff --git a/segmentation/factory.py b/segmentation/factory.py
new file mode 100644
index 0000000..583070c
--- /dev/null
+++ b/segmentation/factory.py
@@ -0,0 +1,42 @@
+from typing import Any
+
+from segmentation.base import AssociationSegmenter
+from segmentation import segmenters
+
+
+def get_segmenter(territory_id: str, association_gazzete: dict[str, Any]) -> AssociationSegmenter:
+    """
+    Factory method to return a AssociationSegmenter
+
+    Example
+    -------
+    >>> association_gazette = {
+        "territory_name": "Associação",
+        "created_at": datetime.datetime.now(),
+        "date": datetime.datetime.now(),
+        "edition_number": 1,
+        "file_path": 'raw/pdf.pdf',
+        "file_url": 'localhost:8000/raw/pdf.pdf',
+        "is_extra_edition": True,
+        "power": 'executive',
+        "scraped_at": datetime.datetime.now(),
+        "state_code": 'AL',
+        "source_text": texto,
+    }
+    >>> from segmentation import get_segmenter
+    >>> segmenter = get_segmenter(territory_id, association_gazette)
+    >>> segments = segmenter.get_gazette_segments()
+
+    Notes
+    -----
+    This method implements a factory method pattern.
+    See: https://github.com/faif/python-patterns/blob/master/patterns/creational/factory.py
+    """
+
+    territory_to_segmenter_class = {
+        "2700000": "ALAssociacaoMunicipiosSegmenter",
+    }
+
+    segmenter_class_name = territory_to_segmenter_class[territory_id]
+    segmenter_class = getattr(segmenters, segmenter_class_name)
+    return segmenter_class(association_gazzete)
diff --git a/segmentation/segmenters/__init__.py b/segmentation/segmenters/__init__.py
new file mode 100644
index 0000000..39de174
--- /dev/null
+++ b/segmentation/segmenters/__init__.py
@@ -0,0 +1,5 @@
+from .al_associacao_municipios import ALAssociacaoMunicipiosSegmenter
+
+__all__ = [
+    "ALAssociacaoMunicipiosSegmenter",
+]
\ No newline at end of file
diff --git a/segmentation/segmenters/al_associacao_municipios.py b/segmentation/segmenters/al_associacao_municipios.py
new file mode 100644
index 0000000..bcf93f3
--- /dev/null
+++ b/segmentation/segmenters/al_associacao_municipios.py
@@ -0,0 +1,136 @@
+import re
+
+from typing import Any
+from segmentation.base import AssociationSegmenter, GazetteSegment
+from tasks.utils import get_checksum
+
+class ALAssociacaoMunicipiosSegmenter(AssociationSegmenter):
+    def __init__(self, association_gazzete: dict[str, Any]):
+        super().__init__(association_gazzete)
+        # No final do regex, existe uma estrutura condicional que verifica se o próximo match é um \s ou SECRETARIA. Isso foi feito para resolver um problema no diário de 2018-10-02, em que o município de Coité do Nóia não foi percebido pelo código. Para resolver isso, utilizamos a próxima palavra (SECRETARIA) para tratar esse caso.
+        # Exceções Notáveis
+        # String: VAMOS, município Poço das Trincheiras, 06/01/2022, ato CCB3A6AB
+        self.RE_NOMES_MUNICIPIOS = (
+            r"ESTADO DE ALAGOAS(?:| )\n{1,2}PREFEITURA MUNICIPAL DE (.*\n{0,2}(?!VAMOS).*$)\n\s(?:\s|SECRETARIA)"
+        )
+        self.association_source_text = self.association_gazette["source_text"]
+
+    def get_gazette_segments(self) -> list[dict[str, Any]]:
+        """
+        Returns a list of dicts with the gazettes metadata
+        """
+        territory_to_text_split = self.split_text_by_territory()
+        gazette_segments = []
+        for municipio, texto_diario in territory_to_text_split.items():
+            segmento = self.build_segment(municipio, texto_diario)
+            gazette_segments.append(segmento.__dict__)
+        return gazette_segments
+
+    def split_text_by_territory(self) -> dict[str, str]:
+        """
+        Segment a association text by territory
+        and returns a dict with the territory name and the text segment
+        """
+        texto_diario_slice = self.association_source_text.lstrip().splitlines()
+
+        # Processamento
+        linhas_apagar = []  # slice de linhas a ser apagadas ao final.
+        ama_header = texto_diario_slice[0]
+        ama_header_count = 0
+        codigo_count = 0
+        codigo_total = self.association_source_text.count("Código Identificador")
+
+        for num_linha, linha in enumerate(texto_diario_slice):
+            # Remoção do cabeçalho AMA, porém temos que manter a primeira aparição.
+            if linha.startswith(ama_header):
+                ama_header_count += 1
+                if ama_header_count > 1:
+                    linhas_apagar.append(num_linha)
+
+            # Remoção das linhas finais
+            if codigo_count == codigo_total:
+                linhas_apagar.append(num_linha)
+            elif linha.startswith("Código Identificador"):
+                codigo_count += 1
+
+        # Apagando linhas do slice
+        texto_diario_slice = [l for n, l in enumerate(
+            texto_diario_slice) if n not in linhas_apagar]
+
+        # Inserindo o cabeçalho no diário de cada município.
+        territory_to_text_split = {}
+        nomes_municipios = re.findall(
+            self.RE_NOMES_MUNICIPIOS, self.association_source_text, re.MULTILINE)
+        for municipio in nomes_municipios:
+            nome_municipio_normalizado = self._normalize_territory_name(municipio)
+            territory_to_text_split[nome_municipio_normalizado] = ama_header + '\n\n'
+
+        num_linha = 0
+        municipio_atual = None
+        while num_linha < len(texto_diario_slice):
+            linha = texto_diario_slice[num_linha].rstrip()
+
+            if linha.startswith("ESTADO DE ALAGOAS"):
+                nome = self._extract_territory_name(texto_diario_slice, num_linha)
+                if nome is not None:
+                    nome_normalizado = self._normalize_territory_name(nome)
+                    municipio_atual = nome_normalizado
+
+            # Só começa, quando algum muncípio for encontrado.
+            if municipio_atual is None:
+                num_linha += 1
+                continue
+
+            # Conteúdo faz parte de um muncípio
+            territory_to_text_split[municipio_atual] += linha + '\n'
+            num_linha += 1
+
+        return territory_to_text_split
+
+    def build_segment(self, territory, segment_text) -> GazetteSegment:
+        file_checksum = get_checksum(segment_text)
+        processed = True
+        territory_name = territory
+        source_text = segment_text.rstrip()
+        
+        # TODO: get territory data and replace the None values
+        territory_id = None
+        # file_raw_txt = f"/{territory_id}/{date}/{file_checksum}.txt"
+        file_raw_txt = None
+        # url = file_raw_txt
+        url = None
+        
+        return GazetteSegment(
+            # same association values
+            created_at=self.association_gazette.get("created_at"),
+            date=self.association_gazette.get("date"),
+            edition_number=self.association_gazette.get("edition_number"),
+            file_path=self.association_gazette.get("file_path"),
+            file_url=self.association_gazette.get("file_url"),
+            is_extra_edition=self.association_gazette.get("is_extra_edition"),
+            power=self.association_gazette.get("power"),
+            scraped_at=self.association_gazette.get("scraped_at"),
+            state_code=self.association_gazette.get("state_code"),
+            url=self.association_gazette.get("url"),
+
+            # segment specific values
+            file_checksum=file_checksum,
+            processed=processed,
+            territory_name=territory_name,
+            source_text=source_text,
+            territory_id=territory_id,
+            file_raw_txt=file_raw_txt,
+        )
+
+    def _normalize_territory_name(self, municipio: str) -> str:
+        municipio = municipio.rstrip().replace('\n', '')  # limpeza inicial
+        # Alguns nomes de municípios possuem um /AL no final, exemplo: Viçosa no diário 2022-01-17, ato 8496EC0A. Para evitar erros como "vicosa-/al-secretaria-municipal...", a linha seguir remove isso. 
+        municipio = re.sub("(\/AL.*|GABINETE DO PREFEITO.*|PODER.*|http.*|PORTARIA.*|Extrato.*|ATA DE.*|SECRETARIA.*|Fundo.*|SETOR.*|ERRATA.*|- AL.*|GABINETE.*)", "", municipio)
+        return municipio
+
+    def _extract_territory_name(self, texto_diario_slice: list[str], num_linha: int):
+        texto = '\n'.join(texto_diario_slice[num_linha:num_linha+10])
+        match = re.findall(self.RE_NOMES_MUNICIPIOS, texto, re.MULTILINE)
+        if len(match) > 0:
+            return match[0].strip().replace('\n', '')
+        return None
diff --git a/tasks/__init__.py b/tasks/__init__.py
index b738481..6d27f79 100644
--- a/tasks/__init__.py
+++ b/tasks/__init__.py
@@ -11,4 +11,4 @@
 )
 from .list_gazettes_to_be_processed import get_gazettes_to_be_processed
 from .list_territories import get_territories_gazettes
-
+from .get_territorie_info import get_territorie_info
diff --git a/tasks/diario_ama.py b/tasks/diario_ama.py
deleted file mode 100644
index 51e9cd3..0000000
--- a/tasks/diario_ama.py
+++ /dev/null
@@ -1,78 +0,0 @@
-import re
-
-from .diario_municipal import Diario, Municipio
-
-# No final do regex, existe uma estrutura condicional que verifica se o próximo match é um \s ou SECRETARIA. Isso foi feito para resolver um problema no diário de 2018-10-02, em que o município de Coité do Nóia não foi percebido pelo código. Para resolver isso, utilizamos a próxima palavra (SECRETARIA) para tratar esse caso.
-# Exceções Notáveis
-# String: VAMOS, município Poço das Trincheiras, 06/01/2022, ato CCB3A6AB
-re_nomes_municipios = (
-    r"ESTADO DE ALAGOAS(?:| )\n{1,2}PREFEITURA MUNICIPAL DE (.*\n{0,2}(?!VAMOS).*$)\n\s(?:\s|SECRETARIA)")
-
-
-def extrair_diarios_municipais(texto_diario: str, pdf_path: dict, territories: list):
-    texto_diario_slice = texto_diario.lstrip().splitlines()
-
-    # Processamento
-    linhas_apagar = []  # slice de linhas a ser apagadas ao final.
-    ama_header = texto_diario_slice[0]
-    ama_header_count = 0
-    codigo_count = 0
-    codigo_total = texto_diario.count("Código Identificador")
-
-    for num_linha, linha in enumerate(texto_diario_slice):
-        # Remoção do cabeçalho AMA, porém temos que manter a primeira aparição.
-        if linha.startswith(ama_header):
-            ama_header_count += 1
-            if ama_header_count > 1:
-                linhas_apagar.append(num_linha)
-
-        # Remoção das linhas finais
-        if codigo_count == codigo_total:
-            linhas_apagar.append(num_linha)
-        elif linha.startswith("Código Identificador"):
-            codigo_count += 1
-
-    # Apagando linhas do slice
-    texto_diario_slice = [l for n, l in enumerate(
-        texto_diario_slice) if n not in linhas_apagar]
-
-    # Inserindo o cabeçalho no diário de cada município.
-    texto_diarios = {}
-    nomes_municipios = re.findall(
-        re_nomes_municipios, texto_diario, re.MULTILINE)
-    for municipio in nomes_municipios:
-        municipio = Municipio(municipio)
-        texto_diarios[municipio] = ama_header + '\n\n'
-
-    num_linha = 0
-    municipio_atual = None
-    while num_linha < len(texto_diario_slice):
-        linha = texto_diario_slice[num_linha].rstrip()
-
-        if linha.startswith("ESTADO DE ALAGOAS"):
-            nome = nome_municipio(texto_diario_slice, num_linha)
-            if nome is not None:
-                municipio_atual = Municipio(nome)
-
-        # Só começa, quando algum muncípio for encontrado.
-        if municipio_atual is None:
-            num_linha += 1
-            continue
-
-        # Conteúdo faz parte de um muncípio
-        texto_diarios[municipio_atual] += linha + '\n'
-        num_linha += 1
-
-    diarios = []
-    for municipio, diario in texto_diarios.items():
-        diarios.append(Diario(municipio, ama_header, diario, pdf_path, territories).__dict__)
-
-    return diarios
-
-
-def nome_municipio(texto_diario_slice: slice, num_linha: int):
-    texto = '\n'.join(texto_diario_slice[num_linha:num_linha+10])
-    match = re.findall(re_nomes_municipios, texto, re.MULTILINE)
-    if len(match) > 0:
-        return match[0].strip().replace('\n', '')
-    return None
diff --git a/tasks/diario_municipal.py b/tasks/diario_municipal.py
deleted file mode 100644
index a215802..0000000
--- a/tasks/diario_municipal.py
+++ /dev/null
@@ -1,102 +0,0 @@
-import json
-import re
-import unicodedata
-from datetime import date, datetime
-from .get_territorie_info import get_territorie_info
-import hashlib
-from io import BytesIO
-
-
-class Municipio:
-
-    def __init__(self, municipio):
-        municipio = municipio.rstrip().replace('\n', '')  # limpeza inicial
-        # Alguns nomes de municípios possuem um /AL no final, exemplo: Viçosa no diário 2022-01-17, ato 8496EC0A. Para evitar erros como "vicosa-/al-secretaria-municipal...", a linha seguir remove isso. 
-        municipio = re.sub("(\/AL.*|GABINETE DO PREFEITO.*|PODER.*|http.*|PORTARIA.*|Extrato.*|ATA DE.*|SECRETARIA.*|Fundo.*|SETOR.*|ERRATA.*|- AL.*|GABINETE.*)", "", municipio)
-        self.id = self._computa_id(municipio)
-        self.nome = municipio
-
-    def _computa_id(self, nome_municipio):
-        ret = nome_municipio.strip().lower().replace(" ", "-")
-        ret = unicodedata.normalize('NFKD', ret)
-        ret = ret.encode('ASCII', 'ignore').decode("utf-8")
-        return ret
-
-    def __hash__(self):
-        return hash(self.id)
-
-    def __eq__(self, other):
-        return self.id == other.id
-
-    def __str__(self):
-        return json.dumps(self.__dict__, indent=2, default=str, ensure_ascii=False)
-
-
-class Diario:
-
-    _mapa_meses = {
-        "Janeiro": 1,
-        "Fevereiro": 2,
-        "Março": 3,
-        "Abril": 4,
-        "Maio": 5,
-        "Junho": 6,
-        "Julho": 7,
-        "Agosto": 8,
-        "Setembro": 9,
-        "Outubro": 10,
-        "Novembro": 11,
-        "Dezembro": 12,
-    }
-
-    def __init__(self, municipio: Municipio, cabecalho: str, texto: str, pdf_path: dict, territories: list):
-
-        self.territory_id, self.territory_name, self.state_code = get_territorie_info(
-            name=municipio.nome,
-            state=cabecalho.split(",")[0],
-            territories=territories)
-
-        self.source_text = texto.rstrip()
-        self.date = self._extrai_data_publicacao(cabecalho)
-        self.edition_number = cabecalho.split("Nº")[1].strip()
-        self.is_extra_edition = False
-        self.power = "executive_legislative"
-        self.file_url = pdf_path["file_url"]
-        self.file_path = pdf_path["file_path"]
-        self.file_checksum = self.md5sum(BytesIO(self.source_text.encode(encoding='UTF-8')))
-        self.scraped_at = datetime.utcnow()
-        self.created_at = self.scraped_at
-        # file_endpoint = gazette_text_extraction.get_file_endpoint()
-        self.file_raw_txt = f"/{self.territory_id}/{self.date}/{self.file_checksum}.txt"
-        self.processed = True
-        self.url = self.file_raw_txt
-
-    def _extrai_data_publicacao(self, ama_header: str):
-        match = re.findall(
-            r".*(\d{2}) de (\w*) de (\d{4})", ama_header, re.MULTILINE)[0]
-        mes = Diario._mapa_meses[match[1]]
-        return date(year=int(match[2]), month=mes, day=int(match[0]))
-
-    def md5sum(self, file):
-        """Calculate the md5 checksum of a file-like object without reading its
-        whole content in memory.
-        from io import BytesIO
-        md5sum(BytesIO(b'file content to hash'))
-        '784406af91dd5a54fbb9c84c2236595a'
-        """
-        m = hashlib.md5()
-        while True:
-            d = file.read(8096)
-            if not d:
-                break
-            m.update(d)
-        return m.hexdigest()
-
-    def __hash__(self):
-        return hash(self.id)
-
-    def __eq__(self, other):
-        return self.id == other.id
-
-    def __str__(self):
-        return dict(self.__dict__)
diff --git a/tasks/utils/__init__.py b/tasks/utils/__init__.py
index 1bd9cf3..ae62c3a 100644
--- a/tasks/utils/__init__.py
+++ b/tasks/utils/__init__.py
@@ -2,4 +2,7 @@
     get_documents_from_query_with_highlights,
     get_documents_with_ids,
 )
-from .text import clean_extra_whitespaces
+from .text import (
+    clean_extra_whitespaces,
+    get_checksum,
+)
\ No newline at end of file
diff --git a/tasks/utils/text.py b/tasks/utils/text.py
index 1cc7c39..7d40bca 100644
--- a/tasks/utils/text.py
+++ b/tasks/utils/text.py
@@ -1,5 +1,28 @@
 import re
+import hashlib
+from io import BytesIO
 
 
 def clean_extra_whitespaces(text: str) -> str:
     return re.sub(r"\s+", " ", text)
+
+
+def get_checksum(source_text: str) -> str:
+    """Calculate the md5 checksum of text
+    by creating a file-like object without reading its
+    whole content in memory.
+
+    Example
+    -------
+    >>> extractor.get_checksum("A simple text")
+        'ef313f200597d0a1749533ba6aeb002e'
+    """
+    file = BytesIO(source_text.encode(encoding="UTF-8"))
+
+    m = hashlib.md5()
+    while True:
+        d = file.read(8096)
+        if not d:
+            break
+        m.update(d)
+    return m.hexdigest()
\ No newline at end of file