Skip to content
New issue

Have a question about this project? Sign up for a free GitHub account to open an issue and contact its maintainers and the community.

By clicking “Sign up for GitHub”, you agree to our terms of service and privacy statement. We’ll occasionally send you account related emails.

Already on GitHub? Sign in to your account

Fix/window event race condition #842

Open
wants to merge 43 commits into
base: main
Choose a base branch
from
Open
Show file tree
Hide file tree
Changes from 19 commits
Commits
Show all changes
43 commits
Select commit Hold shift + click to select a range
4f68487
add joinedload to eagerly load related entities
Animesh404 Jul 3, 2024
85d0100
change get_active_window_data to return empty dict when state is none
Animesh404 Jul 4, 2024
1feea90
add eager as parameter in _get
Animesh404 Jul 4, 2024
418fdef
chore: try pygetwindows
Animesh404 Jul 5, 2024
3410e32
window-event performance test
Animesh404 Jul 8, 2024
b0a66ed
remove unwanted changes from other files
Animesh404 Jul 8, 2024
7ad454b
Merge branch 'main' into fix/WindowEvent-race-condition
Animesh404 Jul 8, 2024
51986f7
fix: add new A11yEvent model
Animesh404 Jul 16, 2024
8b0937d
Merge branch 'main' into fix/WindowEvent-race-condition
Animesh404 Jul 16, 2024
bba8101
remove unnecessary comment
Animesh404 Jul 16, 2024
f770251
Merge branch 'fix/WindowEvent-race-condition' of https://github.com/A…
Animesh404 Jul 16, 2024
a9ecc15
fix: change WindowEvent Model
Animesh404 Jul 16, 2024
ed43695
fixing crud and record.py for a11yevents
Animesh404 Jul 16, 2024
1543390
remove unnecessary test file as we are not using pygetwindow
Animesh404 Jul 16, 2024
28fe26d
fix: fixing data removal logic in WindowEvent model
Animesh404 Jul 17, 2024
8dabc63
add handle and remove window_id
Animesh404 Jul 18, 2024
bbe0c47
chore: db revision
Animesh404 Jul 18, 2024
488bf4b
fix: remove state from window_event and add a11y_counter
Animesh404 Jul 21, 2024
e89710c
remove state from window_event
Animesh404 Jul 22, 2024
574e133
fix: add a11y_event in visualize
Animesh404 Jul 23, 2024
51db67d
Merge branch 'main' into fix/WindowEvent-race-condition
Animesh404 Jul 23, 2024
6e60017
fix: replay error fix and black error fix
Animesh404 Jul 23, 2024
950c1a0
Merge branch 'main' of https://github.com/OpenAdaptAI/OpenAdapt into …
Animesh404 Jul 23, 2024
8b125e4
fix: formatting
Animesh404 Jul 23, 2024
4841c50
Merge branch 'fix/WindowEvent-race-condition' of https://github.com/A…
Animesh404 Jul 23, 2024
31c270f
fix: flake8 error
Animesh404 Jul 23, 2024
32a42ec
Update models.py
abrichr Jul 24, 2024
27e8c75
Update record.py: add a11y_event_reader
abrichr Jul 24, 2024
db6b05a
fix: add read_a11y_data in config
Animesh404 Jul 25, 2024
b275f35
conflict resolve
Animesh404 Jul 25, 2024
6623bb9
resolve conflicts
Animesh404 Jul 25, 2024
597f6c0
remove unnecessry comments and items
Animesh404 Jul 25, 2024
403750a
remove duplicate values from merge resolution
Animesh404 Jul 25, 2024
1148967
rename RECORD_WINDOW_DATA to RECORD_A11Y_DATA and state to a11y_data
Animesh404 Jul 25, 2024
85e23bb
fix: change to_prompt_dict in WindowEvent
Animesh404 Jul 25, 2024
5bfb833
resolve conflict
Animesh404 Jul 25, 2024
d402968
change to_prompt_dict in WindowEvent model
Animesh404 Jul 25, 2024
4147c1c
Merge branch 'main' into fix/WindowEvent-race-condition
Animesh404 Jul 25, 2024
25b830a
update to_prompt_dict
Animesh404 Jul 25, 2024
bf04f51
Merge branch 'fix/WindowEvent-race-condition' of https://github.com/A…
Animesh404 Jul 25, 2024
8c0d2e6
add a11y_data in dashboard
Animesh404 Jul 26, 2024
78ae338
Merge branch 'main' into fix/WindowEvent-race-condition
Animesh404 Jul 26, 2024
3b0ada0
use pygetwindow for window and pywinauto for a11y and display a11y on…
Animesh404 Jul 29, 2024
File filter

Filter by extension

Filter by extension

Conversations
Failed to load comments.
Loading
Jump to
Jump to file
Failed to load files.
Loading
Diff view
Diff view
Original file line number Diff line number Diff line change
@@ -0,0 +1,47 @@
"""add_a11y_event_remove_state_from_window_event

Revision ID: 0884b45e71e9
Revises: bb25e889ad71
Create Date: 2024-07-22 18:16:45.133921

"""
from alembic import op
import sqlalchemy as sa
from sqlalchemy.dialects import sqlite

# revision identifiers, used by Alembic.
revision = '0884b45e71e9'
down_revision = 'bb25e889ad71'
branch_labels = None
depends_on = None


def upgrade() -> None:
    """Apply revision 0884b45e71e9.

    Adds the ``handle`` and ``a11y_counter`` columns to ``window_event``,
    drops its ``state`` and ``window_id`` columns, and creates the new
    ``a11y_event`` table.
    """
    # ### commands auto generated by Alembic - please adjust! ###
    # Alter ``window_event`` first: ``a11y_event`` declares a foreign key on
    # ``window_event.handle``, so that column has to exist before the
    # referencing table is created.
    with op.batch_alter_table('window_event', schema=None) as batch_op:
        batch_op.add_column(sa.Column('handle', sa.Integer(), nullable=True))
        batch_op.add_column(sa.Column('a11y_counter', sa.Integer(), nullable=True))
        # Dropping these columns discards whatever values they held.
        batch_op.drop_column('state')
        batch_op.drop_column('window_id')

    op.create_table('a11y_event',
        sa.Column('id', sa.Integer(), nullable=False),
        sa.Column('handle', sa.Integer(), nullable=False),
        sa.Column('data', sa.JSON(), nullable=True),
        sa.Column('a11y_counter', sa.Integer(), nullable=True),
        sa.ForeignKeyConstraint(['handle'], ['window_event.handle'], name=op.f('fk_a11y_event_handle_window_event')),
        sa.PrimaryKeyConstraint('id', name=op.f('pk_a11y_event'))
    )
    # ### end Alembic commands ###


def downgrade() -> None:
    """Revert revision 0884b45e71e9.

    Drops the ``a11y_event`` table, then restores the ``window_id`` and
    ``state`` columns on ``window_event`` and removes ``a11y_counter`` and
    ``handle``. The restored columns are added empty; values dropped by
    ``upgrade`` are not recovered.
    """
    # ### commands auto generated by Alembic - please adjust! ###
    # Drop the referencing table first: ``a11y_event.handle`` is a foreign key
    # on ``window_event.handle``, so the column must not be removed while the
    # table (and any rows in it) still points at it.
    op.drop_table('a11y_event')

    with op.batch_alter_table('window_event', schema=None) as batch_op:
        batch_op.add_column(sa.Column('window_id', sa.VARCHAR(), nullable=True))
        batch_op.add_column(sa.Column('state', sqlite.JSON(), nullable=True))
        batch_op.drop_column('a11y_counter')
        batch_op.drop_column('handle')
    # ### end Alembic commands ###
24 changes: 24 additions & 0 deletions openadapt/db/crud.py
Original file line number Diff line number Diff line change
Expand Up @@ -28,6 +28,7 @@
Screenshot,
ScrubbedRecording,
WindowEvent,
A11yEvent,
copy_sa_instance,
)
from openadapt.privacy.base import ScrubbingProvider
Expand Down Expand Up @@ -263,6 +264,29 @@ def insert_recording(session: SaSession, recording_data: dict) -> Recording:
return db_obj


def insert_a11y_event(
    db: SaSession,
    data: dict,
) -> None:
    """Build an ``A11yEvent`` row from ``data`` and commit it.

    Args:
        db: The database session.
        data: The a11y event payload. Must contain the keys ``"handle"``,
            ``"state"`` (stored in the row's ``data`` column) and
            ``"a11y_counter"``; a missing key raises ``KeyError``.
    """
    db.add(
        A11yEvent(
            handle=data["handle"],
            data=data["state"],
            a11y_counter=data["a11y_counter"],
        )
    )
    db.commit()


def delete_recording(session: SaSession, recording: Recording) -> None:
"""Remove the recording from the db.

Expand Down
34 changes: 31 additions & 3 deletions openadapt/models.py
Original file line number Diff line number Diff line change
Expand Up @@ -492,6 +492,24 @@ def to_prompt_dict(self) -> dict[str, Any]:
return action_dict


class A11yEvent(db.Base):
    """Database model for an accessibility (a11y) event."""

    __tablename__ = "a11y_event"

    id = sa.Column(sa.Integer, primary_key=True)
    # Foreign key onto the ``handle`` column of ``window_event``.
    handle = sa.Column(sa.ForeignKey("window_event.handle"), nullable=False)
    # JSON payload of the event.
    data = sa.Column(sa.JSON)
    a11y_counter = sa.Column(sa.Integer)

    # Counterpart of ``WindowEvent.a11y_events``.
    window_event = sa.orm.relationship("WindowEvent", back_populates="a11y_events")

    def __init__(self, handle, data, a11y_counter=None) -> None:
        """Create an a11y event.

        Args:
            handle: Value for the ``handle`` foreign-key column.
            data: Value for the JSON ``data`` column.
            a11y_counter: Optional value for the ``a11y_counter`` column.
        """
        self.handle, self.data, self.a11y_counter = handle, data, a11y_counter


class WindowEvent(db.Base):
"""Class representing a window event in the database."""

Expand All @@ -501,16 +519,17 @@ class WindowEvent(db.Base):
recording_timestamp = sa.Column(ForceFloat)
recording_id = sa.Column(sa.ForeignKey("recording.id"))
timestamp = sa.Column(ForceFloat)
state = sa.Column(sa.JSON)
title = sa.Column(sa.String)
left = sa.Column(sa.Integer)
top = sa.Column(sa.Integer)
width = sa.Column(sa.Integer)
height = sa.Column(sa.Integer)
window_id = sa.Column(sa.String)
handle = sa.Column(sa.Integer)
a11y_counter = sa.Column(sa.Integer)
Animesh404 marked this conversation as resolved.
Show resolved Hide resolved

recording = sa.orm.relationship("Recording", back_populates="window_events")
action_events = sa.orm.relationship("ActionEvent", back_populates="window_event")
a11y_events = sa.orm.relationship("A11yEvent", back_populates="window_event")

@classmethod
def get_active_window_event(
Expand All @@ -526,7 +545,16 @@ def get_active_window_event(
Returns:
(WindowEvent) the active window event.
"""
return WindowEvent(**window.get_active_window_data(include_window_data))
window_event_data = window.get_active_window_data(include_window_data)

a11y_event_data = window_event_data.get("state", {}).copy()
Animesh404 marked this conversation as resolved.
Show resolved Hide resolved
window_event_data.pop("state", None)
Animesh404 marked this conversation as resolved.
Show resolved Hide resolved
a11y_event_handle = window_event_data.get("handle")
a11y_event = A11yEvent(data=a11y_event_data, handle=a11y_event_handle)
Animesh404 marked this conversation as resolved.
Show resolved Hide resolved
window_event = WindowEvent(**window_event_data)
window_event.a11y_events.append(a11y_event)

return window_event

def scrub(self, scrubber: ScrubbingProvider | TextScrubbingMixin) -> None:
"""Scrub the window event."""
Expand Down
114 changes: 102 additions & 12 deletions openadapt/record.py
Original file line number Diff line number Diff line change
Expand Up @@ -45,14 +45,15 @@

Event = namedtuple("Event", ("timestamp", "type", "data"))

EVENT_TYPES = ("screen", "action", "window")
EVENT_TYPES = ("screen", "action", "window", "a11y")
LOG_LEVEL = "INFO"
# whether to write events of each type in a separate process
PROC_WRITE_BY_EVENT_TYPE = {
"screen": True,
"screen/video": True,
"action": True,
"window": True,
"a11y": True,
}
PLOT_PERFORMANCE = config.PLOT_PERFORMANCE
NUM_MEMORY_STATS_TO_LOG = 3
Expand Down Expand Up @@ -128,6 +129,7 @@ def process_events(
screen_write_q: sq.SynchronizedQueue,
action_write_q: sq.SynchronizedQueue,
window_write_q: sq.SynchronizedQueue,
a11y_write_q: sq.SynchronizedQueue,
video_write_q: sq.SynchronizedQueue,
perf_q: sq.SynchronizedQueue,
recording: Recording,
Expand All @@ -136,7 +138,9 @@ def process_events(
num_screen_events: multiprocessing.Value,
num_action_events: multiprocessing.Value,
num_window_events: multiprocessing.Value,
num_a11y_events: multiprocessing.Value,
num_video_events: multiprocessing.Value,
window_event_by_id: dict,
Animesh404 marked this conversation as resolved.
Show resolved Hide resolved
) -> None:
"""Process events from the event queue and write them to write queues.

Expand Down Expand Up @@ -167,6 +171,9 @@ def process_events(
started = False
while not terminate_processing.is_set() or not event_q.empty():
event = event_q.get()
if event.type == "window" or event.type == "a11y":
handle = event.data["handle"]
a11y_counter = event.data["a11y_counter"]
if not started:
with started_counter.get_lock():
started_counter.value += 1
Expand Down Expand Up @@ -244,6 +251,24 @@ def process_events(
)
num_window_events.value += 1
prev_saved_window_timestamp = prev_window_event.timestamp
elif event.type == "a11y":
window_event = window_event_by_id[(handle, a11y_counter)]
logger.debug(f"Processing A11yEvent: {event}")
if not window_event:
logger.warning(
f"Discarding A11yEvent with no corresponding WindowEvent: {event}"
)
continue
event.data["window_event_timestamp"] = window_event.timestamp
process_event(
event,
a11y_write_q,
write_a11y_event,
recording,
perf_q,
)
num_a11y_events.value += 1
logger.debug(f"A11yEvent processed: {event}")
else:
raise Exception(f"unhandled {event.type=}")
del prev_event
Expand Down Expand Up @@ -312,7 +337,26 @@ def write_window_event(
perf_q: A queue for collecting performance data.
"""
assert event.type == "window", event
crud.insert_window_event(db, recording, event.timestamp, event.data)
data = event.data
crud.insert_window_event(db, recording, event.timestamp, data)
perf_q.put((event.type, event.timestamp, utils.get_timestamp()))


def write_a11y_event(
    db: crud.SaSession,
    recording: Recording,
    event: Event,
    perf_q: sq.SynchronizedQueue,
) -> None:
    """Store an a11y event in the database and record a performance sample.

    Args:
        db: The database session.
        recording: The recording being captured; not used by this writer.
        event: An a11y event to be written.
        perf_q: A queue for collecting performance data.
    """
    assert event.type == "a11y", event
    crud.insert_a11y_event(db, event.data)
    # Sample the clock only after the insert so the entry reflects write time.
    written_at = utils.get_timestamp()
    perf_q.put((event.type, event.timestamp, written_at))


Expand Down Expand Up @@ -696,6 +740,7 @@ def read_window_events(
terminate_processing: multiprocessing.Event,
recording: Recording,
started_counter: multiprocessing.Value,
window_event_by_id: dict,
) -> None:
"""Read window events and add them to the event queue.

Expand All @@ -710,6 +755,7 @@ def read_window_events(
logger.info("Starting")
prev_window_data = {}
started = False
a11y_counter = 0
while not terminate_processing.is_set():
window_data = window.get_active_window_data()
if not window_data:
Expand All @@ -721,27 +767,41 @@ def read_window_events(
started = True

if window_data["title"] != prev_window_data.get("title") or window_data[
"window_id"
] != prev_window_data.get("window_id"):
"handle"
] != prev_window_data.get("handle"):
# TODO: fix exception sometimes triggered by the next line on win32:
# File "\Python39\lib\threading.py" line 917, in run
# File "...\openadapt\record.py", line 277, in read window events
# File "...\env\lib\site-packages\loguru\logger.py" line 1977, in info
# File "...\env\lib\site-packages\loguru\_logger.py", line 1964, in _log
# for handler in core.handlers.values):
# RuntimeError: dictionary changed size during iteration
_window_data = window_data
_window_data = window_data.copy()
_window_data.pop("state")
logger.info(f"{_window_data=}")
a11y_counter = 0
if window_data != prev_window_data:
logger.debug("Queuing window event for writing")
event_q.put(
Event(
utils.get_timestamp(),
"window",
window_data,
)
a11y_counter += 1
window_data.update({"a11y_counter": a11y_counter})
_window_data = window_data.copy()
Animesh404 marked this conversation as resolved.
Show resolved Hide resolved
_window_data.pop("state", None)
window_event = Event(
utils.get_timestamp(),
"window",
_window_data,
)
event_q.put(window_event)
a11y_event = Event(
utils.get_timestamp(),
"a11y",
window_data,
)
window_event_by_id[(window_data["handle"], window_data["a11y_counter"])] = (
a11y_event # Store a11y event in map
Animesh404 marked this conversation as resolved.
Show resolved Hide resolved
)
event_q.put(a11y_event)

prev_window_data = window_data


Expand Down Expand Up @@ -1175,6 +1235,7 @@ def record(
screen_write_q = sq.SynchronizedQueue()
action_write_q = sq.SynchronizedQueue()
window_write_q = sq.SynchronizedQueue()
a11y_write_q = sq.SynchronizedQueue()
video_write_q = sq.SynchronizedQueue()
# TODO: save write times to DB; display performance plot in visualize.py
perf_q = sq.SynchronizedQueue()
Expand All @@ -1183,9 +1244,17 @@ def record(
started_counter = multiprocessing.Value("i", 0)
expected_starts = 9

window_event_by_id = {}
Animesh404 marked this conversation as resolved.
Show resolved Hide resolved

window_event_reader = threading.Thread(
target=read_window_events,
args=(event_q, terminate_processing, recording, started_counter),
args=(
event_q,
terminate_processing,
recording,
started_counter,
window_event_by_id,
),
)
window_event_reader.start()

Expand All @@ -1210,6 +1279,7 @@ def record(
num_action_events = multiprocessing.Value("i", 0)
num_screen_events = multiprocessing.Value("i", 0)
num_window_events = multiprocessing.Value("i", 0)
num_a11y_events = multiprocessing.Value("i", 0)
num_video_events = multiprocessing.Value("i", 0)

event_processor = threading.Thread(
Expand All @@ -1219,6 +1289,7 @@ def record(
screen_write_q,
action_write_q,
window_write_q,
a11y_write_q,
video_write_q,
perf_q,
recording,
Expand All @@ -1227,7 +1298,9 @@ def record(
num_screen_events,
num_action_events,
num_window_events,
num_a11y_events,
num_video_events,
window_event_by_id,
),
)
event_processor.start()
Expand Down Expand Up @@ -1277,6 +1350,21 @@ def record(
)
window_event_writer.start()

a11y_event_writer = multiprocessing.Process(
target=write_events,
args=(
"a11y",
write_a11y_event,
a11y_write_q,
num_a11y_events,
perf_q,
recording,
terminate_processing,
started_counter,
),
)
a11y_event_writer.start()

if config.RECORD_VIDEO:
expected_starts += 1
video_writer = multiprocessing.Process(
Expand Down Expand Up @@ -1379,7 +1467,9 @@ def record(
screen_event_writer.join()
action_event_writer.join()
window_event_writer.join()
# Join the a11y writer alongside the other event writers. It must not sit
# under the RECORD_VIDEO check, otherwise the process is never joined when
# video recording is disabled.
a11y_event_writer.join()
if config.RECORD_VIDEO:
    video_writer.join()
if config.RECORD_AUDIO:
    audio_recorder.join()
Expand Down
Loading
Loading