Skip to content
New issue

Have a question about this project? Sign up for a free GitHub account to open an issue and contact its maintainers and the community.

By clicking “Sign up for GitHub”, you agree to our terms of service and privacy statement. We’ll occasionally send you account related emails.

Already on GitHub? Sign in to your account

GPSR QA & Repeat states #140

Merged
merged 24 commits into from
Mar 11, 2024
Merged
Show file tree
Hide file tree
Changes from 16 commits
Commits
Show all changes
24 commits
Select commit Hold shift + click to select a range
5d6e21c
data: add 2023 robocup gpsr xml files
m-barker Mar 3, 2024
4cd6361
feat: xml parser for gpsr q/a task component
m-barker Mar 3, 2024
4c049d6
fix: require install of requirements.tt
m-barker Mar 3, 2024
0673914
feat: add backend for creating & querying vector db
m-barker Mar 4, 2024
e8d898a
feat: add sentence embedding utils
m-barker Mar 4, 2024
b4a4ce8
feat: service to create text FAISS index
m-barker Mar 5, 2024
3d3007c
feat: text query service for FAISS
m-barker Mar 5, 2024
898ed1d
feat: working FAISS text services
m-barker Mar 5, 2024
04ddae3
feat: test scripts for FAISS services
m-barker Mar 5, 2024
7321696
docs: add documenation for FAISS vector service
m-barker Mar 5, 2024
86b964b
chore: remove xml files
m-barker Mar 5, 2024
db0750f
feat: xml question answer state
m-barker Mar 6, 2024
9d8a9f1
feat: separate package for vector db messages
m-barker Mar 6, 2024
b012e23
feat: working state machine for gpsr QA task
m-barker Mar 6, 2024
014c6e9
feat: tts question answering
m-barker Mar 6, 2024
e234f9d
feat: working launch file and quesiton answering with TTS
m-barker Mar 6, 2024
d726542
fix: integrate @jws-1 review suggestions
m-barker Mar 11, 2024
397ac6f
feat: add listen state
m-barker Mar 11, 2024
85f5439
chore: create gpsr commands sub folder
m-barker Mar 11, 2024
2c8f257
chore: properly fix ALSA errors
m-barker Mar 11, 2024
d6dde82
feat: speech and voice skills
m-barker Mar 11, 2024
e41b4dd
feat: Q/A skill using new speech/voice skills
m-barker Mar 11, 2024
d7a9b22
fix: working new question answer state machine
m-barker Mar 11, 2024
c2690f1
Merge branch 'main' into gpsr_question_answer
jws-1 Mar 11, 2024
File filter

Filter by extension

Filter by extension


Conversations
Failed to load comments.
Loading
Jump to
Jump to file
Failed to load files.
Loading
Diff view
Diff view
42 changes: 16 additions & 26 deletions common/vector_databases/lasr_vector_databases_faiss/CMakeLists.txt
Original file line number Diff line number Diff line change
Expand Up @@ -7,7 +7,10 @@ project(lasr_vector_databases_faiss)
## Find catkin macros and libraries
## if COMPONENTS list like find_package(catkin REQUIRED COMPONENTS xyz)
## is used, also find other catkin packages
find_package(catkin REQUIRED catkin_virtualenv)
find_package(catkin REQUIRED catkin_virtualenv COMPONENTS
rospy
lasr_vector_databases_msgs
)

## System dependencies are found with CMake's conventions
# find_package(Boost REQUIRED COMPONENTS system)
Expand Down Expand Up @@ -55,8 +58,6 @@ catkin_generate_virtualenv(
## Generate services in the 'srv' folder
# add_service_files(
# FILES
# Service1.srv
# Service2.srv
# )

# Generate actions in the 'action' folder
Expand All @@ -68,8 +69,7 @@ catkin_generate_virtualenv(
# Generate added messages and services with any dependencies listed here
# generate_messages(
# DEPENDENCIES
# actionlib_msgs
# geometry_msgs
# std_msgs
# )

################################################
Expand Down Expand Up @@ -157,22 +157,13 @@ include_directories(

## Mark executable scripts (Python etc.) for installation
## in contrast to setup.py, you can choose the destination
# catkin_install_python(PROGRAMS
# nodes/qualification
# nodes/actions/wait_greet
# nodes/actions/identify
# nodes/actions/greet
# nodes/actions/get_name
# nodes/actions/learn_face
# nodes/actions/get_command
# nodes/actions/guide
# nodes/actions/find_person
# nodes/actions/detect_people
# nodes/actions/receive_object
# nodes/actions/handover_object
# nodes/better_qualification
# DESTINATION ${CATKIN_PACKAGE_BIN_DESTINATION}
# )
catkin_install_python(PROGRAMS
nodes/txt_index_service
nodes/txt_query_service
scripts/test_index_service.py
scripts/test_query_service.py
DESTINATION ${CATKIN_PACKAGE_BIN_DESTINATION}
)

## Mark executables for installation
## See http://docs.ros.org/melodic/api/catkin/html/howto/format1/building_executables.html
Expand All @@ -196,11 +187,10 @@ include_directories(
# )

## Mark other files for installation (e.g. launch and bag files, etc.)
# install(FILES
# # myfile1
# # myfile2
# DESTINATION ${CATKIN_PACKAGE_SHARE_DESTINATION}
# )
install(FILES
requirements.txt
DESTINATION ${CATKIN_PACKAGE_SHARE_DESTINATION}
)

#############
## Testing ##
Expand Down
Empty file.
33 changes: 33 additions & 0 deletions common/vector_databases/lasr_vector_databases_faiss/doc/USAGE.md
Original file line number Diff line number Diff line change
@@ -0,0 +1,33 @@
This package currently contains two services `txt_index_service` and `txt_query_service`. These services are used to create and search (respectively) a vector database of natural language sentence embeddings.

# Index Service
The Index service is used to create a [FAISS](https://github.com/facebookresearch/faiss) index object containing a set of sentence embeddings, where each sentence is assumed to be a line in a given `.txt` file. This Index object is saved to disk at a specified location, and can be thought of as a Vector Database.

## Request
The request takes two string parameters: `txt_path` which is the path to the `.txt` file we wish to create sentence embeddings for, where each line in this file is treated as a sentence; and `index_path` which is the path to a `.index` file that will be created by the Service.

## Response
No response is given from this service.

## Example Usage
Please see the `scripts/test_index_service.py` script for a simple example of sending a request to the service.

# Query Service
The query service is used to search the `.index` file created by the Index Service to find the most similar sentences given an input query sentence.

## Request
The request requires four fields:

1. `txt_path` -- this is a `string` that is the path to the txt file that contains the original sentences that the `.index` file was populated with.
2. `index_path` -- this is a `string` that is the path to the `.index` file that was created with the Index Service, on the same txt file as the `txt_path`.
3. `query_sentence` -- this is a `string` that is the sentence that you wish to query the index with and find the most similar sentence.
4. `k` -- this is a `uint8` that is the number of closest sentences you wish to return.

## Response
The response contains two fields:

1. `closest_sentences` -- this is an ordered list of `string`s that contain the closest sentences to the given query sentence.
2. `cosine_similaities` -- this is an ordered list of `float32`s that contain the cosine similarity scores of the closest sentences.

## Example Usage
Please see the `scripts/test_query_service.py` script for a simple example of sending a request to the service.
Original file line number Diff line number Diff line change
@@ -0,0 +1,33 @@
#!/usr/bin/env python3
import rospy
import numpy as np
from lasr_vector_databases_msgs.srv import TxtIndexRequest, TxtIndexResponse, TxtIndex
from lasr_vector_databases_faiss import (
load_model,
parse_txt_file,
get_sentence_embeddings,
create_vector_database,
)


class TxtIndexService:
def __init__(self):
rospy.init_node("txt_index_service")
m-barker marked this conversation as resolved.
Show resolved Hide resolved
rospy.Service("lasr_faiss/txt_index", TxtIndex, self.execute_cb)
self._sentence_embedding_model = load_model()
rospy.loginfo("Text index service started")

def execute_cb(self, req: TxtIndexRequest):
txt_fp: str = req.txt_path
sentences_to_embed: list[str] = parse_txt_file(txt_fp)
sentence_embeddings: np.ndarray = get_sentence_embeddings(
sentences_to_embed, self._sentence_embedding_model
)
index_path: str = req.index_path
create_vector_database(sentence_embeddings, index_path)
return TxtIndexResponse()


if __name__ == "__main__":
TxtIndexService()
rospy.spin()
Original file line number Diff line number Diff line change
@@ -0,0 +1,46 @@
#!/usr/bin/env python3
import rospy
import numpy as np

from lasr_vector_databases_msgs.srv import (
TxtQueryRequest,
TxtQueryResponse,
TxtQuery,
)
from lasr_vector_databases_faiss import (
load_model,
parse_txt_file,
get_sentence_embeddings,
load_vector_database,
query_database,
)


class TxtQueryService:
def __init__(self):
rospy.init_node("txt_query_service")
m-barker marked this conversation as resolved.
Show resolved Hide resolved
self._sentence_embedding_model = load_model()
print(self._sentence_embedding_model)
m-barker marked this conversation as resolved.
Show resolved Hide resolved
rospy.Service("lasr_faiss/txt_query", TxtQuery, self.execute_cb)
rospy.loginfo("Text Query service started")

def execute_cb(self, req: TxtQueryRequest) -> TxtQueryResponse:
txt_fp: str = req.txt_path
index_path: str = req.index_path
query_sentence: str = req.query_sentence
possible_matches: list[str] = parse_txt_file(txt_fp)
query_embedding: np.ndarray = get_sentence_embeddings(
[query_sentence], self._sentence_embedding_model # requires list of strings
)
distances, indices = query_database(index_path, query_embedding, k=req.k)
nearest_matches = [possible_matches[i] for i in indices[0]]

return TxtQueryResponse(
closest_sentences=nearest_matches,
cosine_similarities=distances[0].tolist(),
)


if __name__ == "__main__":
TxtQueryService()
rospy.spin()
Original file line number Diff line number Diff line change
Expand Up @@ -50,6 +50,7 @@
<!-- <doc_depend>doxygen</doc_depend> -->
<buildtool_depend>catkin</buildtool_depend>
<build_depend>catkin_virtualenv</build_depend>
<depend>lasr_vector_databases_msgs</depend>
<!-- The export tag contains other, unspecified, tags -->
<export>
<!-- Other tools can request additional information be placed here -->
Expand Down
Original file line number Diff line number Diff line change
@@ -1 +1,3 @@
faiss-cpu
faiss-cpu
sentence-transformers
torch
Original file line number Diff line number Diff line change
@@ -0,0 +1,14 @@
#!/usr/bin/env python3
import rospy
from lasr_vector_databases_faiss.srv import TxtIndex, TxtIndexRequest

request = TxtIndexRequest()

request.txt_path = (
"/home/mattbarker/LASR/lasr_ws/src/lasr-base/tasks/gpsr/data/questions.txt"
)

request.index_path = (
"/home/mattbarker/LASR/lasr_ws/src/lasr-base/tasks/gpsr/data/questions.index"
)
rospy.ServiceProxy("lasr_faiss/txt_index", TxtIndex)(request)
Original file line number Diff line number Diff line change
@@ -0,0 +1,22 @@
#!/usr/bin/env python3
import rospy
from lasr_vector_databases_faiss.srv import TxtQuery, TxtQueryRequest

request = TxtQueryRequest()

request.txt_path = (
"/home/mattbarker/LASR/lasr_ws/src/lasr-base/tasks/gpsr/data/questions.txt"
)

request.index_path = (
"/home/mattbarker/LASR/lasr_ws/src/lasr-base/tasks/gpsr/data/questions.index"
)

request.query_sentence = "Do French like snails?"

request.k = 3

response = rospy.ServiceProxy("lasr_faiss/txt_query", TxtQuery)(request)

print(response.closest_sentences)
print(response.cosine_similarities)
Original file line number Diff line number Diff line change
@@ -0,0 +1,2 @@
from .database_utils import create_vector_database, load_vector_database, query_database
from .get_sentence_embeddings import get_sentence_embeddings, load_model, parse_txt_file
Loading
Loading